-
Notifications
You must be signed in to change notification settings - Fork 3k
API: Drop column of deleted partitioned field to Unbound partitionSpec #4602
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
32d4bec
98ee0fe
f193aa2
831ec01
ca05e06
1e9c1c6
fee7bc9
f7e2fa9
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -18,9 +18,11 @@ | |
| */ | ||
| package org.apache.iceberg.spark.extensions; | ||
|
|
||
| import java.sql.Timestamp; | ||
| import java.util.Map; | ||
| import org.apache.iceberg.PartitionSpec; | ||
| import org.apache.iceberg.Table; | ||
| import org.apache.iceberg.relocated.com.google.common.collect.ImmutableList; | ||
| import org.apache.iceberg.spark.source.SparkTable; | ||
| import org.apache.spark.sql.connector.catalog.CatalogManager; | ||
| import org.apache.spark.sql.connector.catalog.Identifier; | ||
|
|
@@ -421,16 +423,97 @@ public void testSparkTableAddDropPartitions() throws Exception { | |
| "spark table partition should be empty", 0, sparkTable().partitioning().length); | ||
| } | ||
|
|
||
| @Test | ||
| public void testUnboundPartitionSpecFormatVersion1() throws Exception { | ||
| sql( | ||
|
Collaborator
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Just an idea: since both tests are identical except for the format version, they could be merged into a single parameterized test. This way it could be easily extended for future versions as well. WDYT? |
||
| "CREATE TABLE IF NOT EXISTS %s (id bigint NOT NULL, ts timestamp, data string) USING iceberg " | ||
| + "TBLPROPERTIES ('format-version' = 1, 'write.delete.mode' = 'merge-on-read')", | ||
| tableName); | ||
| Assert.assertEquals( | ||
| "spark table partition should be empty", 0, sparkTable().partitioning().length); | ||
|
|
||
| sql("INSERT INTO %s VALUES (1, current_timestamp(), 'format-version-1-first-data')", tableName); | ||
| Assert.assertEquals( | ||
| "Should have 1 rows after insert", 1L, scalarSql("SELECT count(*) FROM %s", tableName)); | ||
|
|
||
| sql("ALTER TABLE %s ADD PARTITION FIELD truncate(data, 4)", tableName); | ||
| assertPartitioningEquals(sparkTable(), 1, "truncate(data, 4)"); | ||
|
|
||
| sql( | ||
| "INSERT INTO %s VALUES (2, current_timestamp(), 'format-version-1-second-data')", | ||
| tableName); | ||
| Assert.assertEquals( | ||
| "Should have 2 rows after insert", 2L, scalarSql("SELECT count(*) FROM %s", tableName)); | ||
|
|
||
| sql("ALTER TABLE %s DROP PARTITION FIELD truncate(data, 4)", tableName); | ||
| Assert.assertEquals( | ||
| "spark table partition should be empty", 0, sparkTable().partitioning().length); | ||
|
|
||
| sql("INSERT INTO %s VALUES (3, current_timestamp(), 'format-version-1-third-data')", tableName); | ||
| Assert.assertEquals( | ||
| "Should have 3 rows after insert", 3L, scalarSql("SELECT count(*) FROM %s", tableName)); | ||
|
|
||
| sql("ALTER TABLE %s DROP COLUMN data", tableName); | ||
|
|
||
| Assert.assertEquals( | ||
|
Collaborator
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. In addition to the data read test, shall we add a test to read back the partition spec as well? |
||
| "Should have 3 rows after insert", 3L, scalarSql("SELECT count(*) FROM %s", tableName)); | ||
| } | ||
|
|
||
| @Test | ||
| public void testUnboundPartitionSpecFormatVersion2() throws Exception { | ||
| sql( | ||
| "CREATE TABLE IF NOT EXISTS %s (id bigint NOT NULL, ts timestamp, data string) USING iceberg " | ||
| + "TBLPROPERTIES ('format-version' = 2, 'write.delete.mode' = 'merge-on-read')", | ||
| tableName); | ||
| Assert.assertEquals( | ||
| "spark table partition should be empty", 0, sparkTable().partitioning().length); | ||
|
|
||
| sql("INSERT INTO %s VALUES (1, current_timestamp(), 'format-version-2-first-data')", tableName); | ||
| Assert.assertEquals( | ||
| "Should have 1 rows after insert", 1L, scalarSql("SELECT count(*) FROM %s", tableName)); | ||
|
|
||
| sql("ALTER TABLE %s ADD PARTITION FIELD truncate(data, 4)", tableName); | ||
| assertPartitioningEquals(sparkTable(), 1, "truncate(data, 4)"); | ||
|
|
||
| sql( | ||
| "INSERT INTO %s VALUES (2, current_timestamp(), 'format-version-2-second-data')", | ||
| tableName); | ||
| Assert.assertEquals( | ||
| "Should have 2 rows after insert", 2L, scalarSql("SELECT count(*) FROM %s", tableName)); | ||
|
|
||
| sql("ALTER TABLE %s DROP PARTITION FIELD truncate(data, 4)", tableName); | ||
| Assert.assertEquals( | ||
| "spark table partition should be empty", 0, sparkTable().partitioning().length); | ||
|
|
||
| sql("INSERT INTO %s VALUES (3, current_timestamp(), 'format-version-2-third-data')", tableName); | ||
| Assert.assertEquals( | ||
| "Should have 3 rows after insert", 3L, scalarSql("SELECT count(*) FROM %s", tableName)); | ||
|
|
||
| sql("ALTER TABLE %s DROP COLUMN data", tableName); | ||
|
|
||
| Assert.assertEquals( | ||
| "Should have 3 rows after insert", 3L, scalarSql("SELECT count(*) FROM %s", tableName)); | ||
| } | ||
|
|
||
| @Test | ||
| public void testDropColumnOfOldPartitionFieldV1() { | ||
| // default table created in v1 format | ||
| sql( | ||
| "CREATE TABLE %s (id bigint NOT NULL, ts timestamp, day_of_ts date) USING iceberg PARTITIONED BY (day_of_ts) TBLPROPERTIES('format-version' = '1')", | ||
| tableName); | ||
|
|
||
| sql( | ||
| "INSERT INTO %s VALUES (1, CAST('2022-01-01 10:00:00' AS TIMESTAMP), CAST('2022-01-01' AS DATE))", | ||
| tableName); | ||
|
|
||
| sql("ALTER TABLE %s REPLACE PARTITION FIELD day_of_ts WITH days(ts)", tableName); | ||
|
|
||
| sql("ALTER TABLE %s DROP COLUMN day_of_ts", tableName); | ||
|
|
||
| assertEquals( | ||
| "Should have expected rows", | ||
| ImmutableList.of(row(1L, Timestamp.valueOf("2022-01-01 10:00:00"))), | ||
| sql("SELECT * FROM %s WHERE ts < current_timestamp()", tableName)); | ||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Reading from the table is actually breaking on current master: |
||
| } | ||
|
|
||
| @Test | ||
|
|
@@ -439,9 +522,18 @@ public void testDropColumnOfOldPartitionFieldV2() { | |
| "CREATE TABLE %s (id bigint NOT NULL, ts timestamp, day_of_ts date) USING iceberg PARTITIONED BY (day_of_ts) TBLPROPERTIES('format-version' = '2')", | ||
| tableName); | ||
|
|
||
| sql( | ||
| "INSERT INTO %s VALUES (1, CAST('2022-01-01 10:00:00' AS TIMESTAMP), CAST('2022-01-01' AS DATE))", | ||
| tableName); | ||
|
|
||
| sql("ALTER TABLE %s REPLACE PARTITION FIELD day_of_ts WITH days(ts)", tableName); | ||
|
|
||
| sql("ALTER TABLE %s DROP COLUMN day_of_ts", tableName); | ||
|
|
||
| assertEquals( | ||
| "Should have expected rows", | ||
| ImmutableList.of(row(1L, Timestamp.valueOf("2022-01-01 10:00:00"))), | ||
| sql("SELECT * FROM %s WHERE ts < current_timestamp()", tableName)); | ||
| } | ||
|
|
||
| private void assertPartitioningEquals(SparkTable table, int len, String transform) { | ||
|
|
||
Uh oh!
There was an error while loading. Please reload this page.