-
Notifications
You must be signed in to change notification settings - Fork 3.5k
Support Iceberg row-level delete and update #10075
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -27,13 +27,17 @@ | |
|
|
||
| import javax.inject.Inject; | ||
|
|
||
| import java.io.Externalizable; | ||
| import java.io.IOException; | ||
| import java.io.ObjectInput; | ||
| import java.io.ObjectOutput; | ||
| import java.util.Optional; | ||
|
|
||
| import static com.google.common.base.MoreObjects.toStringHelper; | ||
| import static java.util.Objects.requireNonNull; | ||
|
|
||
| public class HdfsEnvironment | ||
| implements Externalizable | ||
| { | ||
| static { | ||
| HadoopNative.requireHadoopNative(); | ||
|
|
@@ -102,7 +106,29 @@ public void doAs(ConnectorIdentity identity, Runnable action) | |
| hdfsAuthentication.doAs(identity, action); | ||
| } | ||
|
|
||
| public HdfsEnvironment() | ||
| { | ||
| this.hdfsConfiguration = null; | ||
| this.hdfsAuthentication = null; | ||
| this.newDirectoryPermissions = null; | ||
| this.newFileInheritOwnership = false; | ||
| this.verifyChecksum = false; | ||
| } | ||
|
|
||
| @Override | ||
| public void writeExternal(ObjectOutput out) | ||
| throws IOException | ||
| { | ||
| } | ||
|
|
||
| @Override | ||
| public void readExternal(ObjectInput in) | ||
| throws IOException, ClassNotFoundException | ||
| { | ||
| } | ||
|
|
||
| public static class HdfsContext | ||
| implements Externalizable | ||
| { | ||
| private final ConnectorIdentity identity; | ||
|
|
||
|
|
@@ -130,5 +156,22 @@ public String toString() | |
| .add("user", identity) | ||
| .toString(); | ||
| } | ||
|
|
||
| public HdfsContext() | ||
| { | ||
| identity = null; | ||
| } | ||
|
|
||
| @Override | ||
| public void writeExternal(ObjectOutput out) | ||
| throws IOException | ||
| { | ||
| } | ||
|
|
||
| @Override | ||
| public void readExternal(ObjectInput in) | ||
| throws IOException, ClassNotFoundException | ||
| { | ||
| } | ||
|
Comment on lines
+166
to
+175
Member
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Same as above. This is neither correct, nor desired. |
||
| } | ||
| } | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -25,11 +25,26 @@ | |
| import java.util.Objects; | ||
| import java.util.Optional; | ||
|
|
||
| import static io.trino.plugin.iceberg.ColumnIdentity.primitiveColumnIdentity; | ||
| import static io.trino.spi.type.BigintType.BIGINT; | ||
| import static java.util.Objects.requireNonNull; | ||
| import static org.apache.iceberg.MetadataColumns.IS_DELETED; | ||
| import static org.apache.iceberg.MetadataColumns.ROW_POSITION; | ||
|
|
||
| public class IcebergColumnHandle | ||
| implements ColumnHandle | ||
| { | ||
| public static final IcebergColumnHandle ROW_POSITION_HANDLE = new IcebergColumnHandle( | ||
| primitiveColumnIdentity(ROW_POSITION.fieldId(), ROW_POSITION.name()), | ||
| BIGINT, | ||
| ImmutableList.of(), | ||
| BIGINT, | ||
| Optional.empty()); | ||
|
|
||
| // use Integer.MIN_VALUE as $row_id field ID, which is currently not reserved by Iceberg | ||
|
Member
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Would we know if Iceberg starts using this ID internally? Would something break?
Member
Author
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Because the Iceberg column name and type could change, comparing the column ID is needed for the equality check. Using a duplicated column ID would cause issues in that area. All the Iceberg metadata columns have IDs counting down from `Integer.MAX_VALUE`. |
||
| public static final int TRINO_ROW_ID_COLUMN_ID = Integer.MIN_VALUE; | ||
| public static final String TRINO_ROW_ID_COLUMN_NAME = "$row_id"; | ||
|
|
||
| private final ColumnIdentity baseColumnIdentity; | ||
| private final Type baseType; | ||
| // The list of field ids to indicate the projected part of the top-level column represented by baseColumnIdentity | ||
|
|
@@ -138,6 +153,21 @@ public boolean isBaseColumn() | |
| return path.isEmpty(); | ||
| } | ||
|
|
||
| public boolean isIcebergRowPositionMetadataColumn() | ||
| { | ||
| return id == ROW_POSITION.fieldId(); | ||
| } | ||
|
|
||
| public boolean isIcebergIsDeletedMetadataColumn() | ||
| { | ||
| return id == IS_DELETED.fieldId(); | ||
| } | ||
|
|
||
| public boolean isTrinoRowIdColumn() | ||
| { | ||
| return id == TRINO_ROW_ID_COLUMN_ID; | ||
| } | ||
|
|
||
| @Override | ||
| public int hashCode() | ||
| { | ||
|
|
||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -19,6 +19,7 @@ | |
| import io.trino.plugin.hive.HiveCompressionCodec; | ||
| import org.apache.iceberg.FileFormat; | ||
|
|
||
| import javax.validation.constraints.Max; | ||
| import javax.validation.constraints.Min; | ||
| import javax.validation.constraints.NotNull; | ||
|
|
||
|
|
@@ -29,6 +30,9 @@ | |
|
|
||
| public class IcebergConfig | ||
| { | ||
| public static final int FORMAT_VERSION_SUPPORT_MIN = 1; | ||
| public static final int FORMAT_VERSION_SUPPORT_MAX = 2; | ||
|
Comment on lines
+33
to
+34
Member
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. nit: MIN/MAX_SUPPORTED_VERSION |
||
|
|
||
| private IcebergFileFormat fileFormat = ORC; | ||
| private HiveCompressionCodec compressionCodec = GZIP; | ||
| private boolean useFileSizeFromMetadata = true; | ||
|
|
@@ -38,6 +42,7 @@ public class IcebergConfig | |
| private Duration dynamicFilteringWaitTimeout = new Duration(0, SECONDS); | ||
| private boolean tableStatisticsEnabled = true; | ||
| private boolean projectionPushdownEnabled = true; | ||
| private int formatVersion = FORMAT_VERSION_SUPPORT_MIN; | ||
|
Member
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Why not 2? Please document the choice. |
||
|
|
||
| public CatalogType getCatalogType() | ||
| { | ||
|
|
@@ -167,4 +172,19 @@ public IcebergConfig setProjectionPushdownEnabled(boolean projectionPushdownEnab | |
| this.projectionPushdownEnabled = projectionPushdownEnabled; | ||
| return this; | ||
| } | ||
|
|
||
| @Min(FORMAT_VERSION_SUPPORT_MIN) | ||
| @Max(FORMAT_VERSION_SUPPORT_MAX) | ||
| public int getFormatVersion() | ||
| { | ||
| return formatVersion; | ||
| } | ||
|
|
||
| @Config("iceberg.format-version") | ||
| @ConfigDescription("Iceberg table format version to use when creating a table") | ||
| public IcebergConfig setFormatVersion(int formatVersion) | ||
| { | ||
| this.formatVersion = formatVersion; | ||
| return this; | ||
| } | ||
| } | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -35,6 +35,7 @@ | |
| import org.apache.hadoop.fs.FileSystem; | ||
| import org.apache.hadoop.fs.Path; | ||
| import org.apache.hadoop.mapred.JobConf; | ||
| import org.apache.iceberg.FileContent; | ||
| import org.apache.iceberg.FileFormat; | ||
| import org.apache.iceberg.Schema; | ||
| import org.apache.iceberg.types.Types; | ||
|
|
@@ -110,11 +111,12 @@ public IcebergFileWriter createFileWriter( | |
| JobConf jobConf, | ||
| ConnectorSession session, | ||
| HdfsContext hdfsContext, | ||
| FileFormat fileFormat) | ||
| FileFormat fileFormat, | ||
| FileContent fileContent) | ||
| { | ||
| switch (fileFormat) { | ||
| case PARQUET: | ||
| return createParquetWriter(outputPath, icebergSchema, jobConf, session, hdfsContext); | ||
| return createParquetWriter(outputPath, icebergSchema, jobConf, session, hdfsContext, fileContent); | ||
|
Member
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Why? At least add a comment explaining this. |
||
| case ORC: | ||
| return createOrcWriter(outputPath, icebergSchema, jobConf, session); | ||
| default: | ||
|
|
@@ -127,7 +129,8 @@ private IcebergFileWriter createParquetWriter( | |
| Schema icebergSchema, | ||
| JobConf jobConf, | ||
| ConnectorSession session, | ||
| HdfsContext hdfsContext) | ||
| HdfsContext hdfsContext, | ||
| FileContent fileContent) | ||
| { | ||
| List<String> fileColumnNames = icebergSchema.columns().stream() | ||
| .map(Types.NestedField::name) | ||
|
|
@@ -162,7 +165,8 @@ private IcebergFileWriter createParquetWriter( | |
| nodeVersion.toString(), | ||
| outputPath, | ||
| hdfsEnvironment, | ||
| hdfsContext); | ||
| hdfsContext, | ||
| fileContent); | ||
| } | ||
| catch (IOException e) { | ||
| throw new TrinoException(ICEBERG_WRITER_OPEN_ERROR, "Error creating Parquet file", e); | ||
|
|
||
There was a problem hiding this comment.
Choose a reason for hiding this comment.
The reason will be displayed to describe this comment to others. Learn more.
That's unlikely to be a correct serialization of
`HdfsEnvironment` state, since it doesn't seem to store anything. Anyway, we should not make this class serializable (nor `Externalizable`) at all.