From eca7e534fd28db6106a0489829b2453a82fc544c Mon Sep 17 00:00:00 2001 From: Michael Barry Date: Sun, 26 May 2024 06:50:50 -0400 Subject: [PATCH] Attach parquet schema to features (#897) --- .../reader/parquet/ParquetFeature.java | 18 +++++++++++++++++- .../reader/parquet/ParquetInputFile.java | 4 +++- 2 files changed, 20 insertions(+), 2 deletions(-) diff --git a/planetiler-core/src/main/java/com/onthegomap/planetiler/reader/parquet/ParquetFeature.java b/planetiler-core/src/main/java/com/onthegomap/planetiler/reader/parquet/ParquetFeature.java index 895fb9a662..22e01a229b 100644 --- a/planetiler-core/src/main/java/com/onthegomap/planetiler/reader/parquet/ParquetFeature.java +++ b/planetiler-core/src/main/java/com/onthegomap/planetiler/reader/parquet/ParquetFeature.java @@ -4,8 +4,10 @@ import com.onthegomap.planetiler.geo.GeometryException; import com.onthegomap.planetiler.reader.SourceFeature; import com.onthegomap.planetiler.reader.Struct; +import java.nio.file.Path; import java.util.List; import java.util.Map; +import org.apache.parquet.schema.MessageType; import org.locationtech.jts.geom.Geometry; import org.locationtech.jts.geom.Lineal; import org.locationtech.jts.geom.Polygonal; @@ -18,15 +20,29 @@ public class ParquetFeature extends SourceFeature { private final GeometryReader geometryParser; private final Object rawGeometry; + private final Path path; + private final MessageType schema; private Geometry latLon; private Geometry world; private Struct struct = null; ParquetFeature(String source, String sourceLayer, long id, GeometryReader geometryParser, - Map tags) { + Map tags, Path path, MessageType schema) { super(tags, source, sourceLayer, List.of(), id); this.geometryParser = geometryParser; this.rawGeometry = tags.remove(geometryParser.geometryColumn); + this.path = path; + this.schema = schema; + } + + /** Returns the parquet file that this feature was read from. */ + public Path path() { + return path; + } + + /** Returns the {@link MessageType} schema of the parquet file that this feature was read from. */ + public MessageType parquetSchema() { + return schema; } @Override diff --git a/planetiler-core/src/main/java/com/onthegomap/planetiler/reader/parquet/ParquetInputFile.java b/planetiler-core/src/main/java/com/onthegomap/planetiler/reader/parquet/ParquetInputFile.java index 393014b2b6..28f560729e 100644 --- a/planetiler-core/src/main/java/com/onthegomap/planetiler/reader/parquet/ParquetInputFile.java +++ b/planetiler-core/src/main/java/com/onthegomap/planetiler/reader/parquet/ParquetInputFile.java @@ -180,7 +180,9 @@ public ParquetFeature next() { idGenerator != null ? idGenerator.applyAsLong(item) : Hashing.fnv1a64(blockHash, ByteBuffer.allocate(8).putLong(i).array()), geometryReader, - item + item, + path, + schema ); if (postFilterBounds != null) {