apache · ramitg254 · Apr 8, 2026 · Apr 9, 2026 · Apr 9, 2026 · Apr 10, 2026
diff --git a/...g/iceberg-handler/src/main/java/org/apache/iceberg/mr/hive/HiveIcebergStorageHandler.java b/...g/iceberg-handler/src/main/java/org/apache/iceberg/mr/hive/HiveIcebergStorageHandler.java
@@ -1536,10 +1536,10 @@ public List<FieldSchema> acidSelectColumns(org.apache.hadoop.hive.ql.metadata.Ta
       case DELETE ->
         // TODO: make it configurable whether we want to include the table columns in the select query.
         // It might make delete writes faster if we don't have to write out the row object
-          ListUtils.union(ACID_VIRTUAL_COLS_AS_FIELD_SCHEMA, table.getCols());
+          ListUtils.union(ACID_VIRTUAL_COLS_AS_FIELD_SCHEMA, table.getAllCols());
       case UPDATE -> shouldOverwrite(table, operation) ?
           ACID_VIRTUAL_COLS_AS_FIELD_SCHEMA :
-          ListUtils.union(ACID_VIRTUAL_COLS_AS_FIELD_SCHEMA, table.getCols());
+          ListUtils.union(ACID_VIRTUAL_COLS_AS_FIELD_SCHEMA, table.getAllCols());
       case MERGE -> ACID_VIRTUAL_COLS_AS_FIELD_SCHEMA;
       default -> ImmutableList.of();
     };
@@ -2130,6 +2130,9 @@ public List<Partition> getPartitions(org.apache.hadoop.hive.ql.metadata.Table hm
   }
 
   public boolean isPartitioned(org.apache.hadoop.hive.ql.metadata.Table hmsTable) {
+    if (hmsTable.getMetaTable() != null) {
+      return false;
+    }
     if (!hmsTable.getTTable().isSetId()) {
       return false;
     }
@@ -2275,6 +2278,9 @@ public boolean canPerformMetadataDelete(org.apache.hadoop.hive.ql.metadata.Table
 
   @Override
   public List<FieldSchema> getPartitionKeys(org.apache.hadoop.hive.ql.metadata.Table hmsTable) {
+    if (hmsTable.getMetaTable() != null) {
+      return Collections.emptyList();
+    }
     if (!hmsTable.getTTable().isSetId()) {
       return Collections.emptyList();
     }

diff --git a/...handler/src/test/java/org/apache/iceberg/mr/hive/TestHiveIcebergStorageHandlerNoScan.java b/...handler/src/test/java/org/apache/iceberg/mr/hive/TestHiveIcebergStorageHandlerNoScan.java
@@ -946,7 +946,8 @@ public void testCreateTableWithoutColumnComments() {
   @Test
   public void testCreatePartitionedTableWithColumnComments() {
     TableIdentifier identifier = TableIdentifier.of("default", "partitioned_with_comment_table");
-    String[] expectedDoc = new String[] {"int column", "string column", null, "partition column", null};
+    String[] expectedDoc = new String[] {"int column", "string column", null, "partition column",
+        "Transform: identity"};
     shell.executeStatement("CREATE EXTERNAL TABLE partitioned_with_comment_table (" +
         "t_int INT COMMENT 'int column',  " +
         "t_string STRING COMMENT 'string column', " +
@@ -959,13 +960,18 @@ public void testCreatePartitionedTableWithColumnComments() {
 
     List<Object[]> rows = shell.executeStatement("DESCRIBE default.partitioned_with_comment_table");
     List<Types.NestedField> columns = icebergTable.schema().columns();
+    List<String> partitionColumns = List.of("t_string_3", "t_string_4");
     // The partition transform information and partition information is 6 extra lines, and 4 more line for the columns
     Assert.assertEquals(columns.size() + 10, rows.size());
     for (int i = 0; i < columns.size(); i++) {
       Types.NestedField field = columns.get(i);
-      Assert.assertArrayEquals(new Object[] {field.name(), HiveSchemaUtil.convert(field.type()).getTypeName(),
-          field.doc() != null ? field.doc() : ""}, rows.get(i));
-      Assert.assertEquals(expectedDoc[i], field.doc());
+      String fieldDoc = field.doc();
+      if (fieldDoc == null && partitionColumns.contains(field.name())) {
+        fieldDoc = "Transform: identity";
+      }
+      Assert.assertArrayEquals(new Object[]{field.name(), HiveSchemaUtil.convert(field.type()).getTypeName(),
+          fieldDoc != null ? fieldDoc : ""}, rows.get(i));
+      Assert.assertEquals(expectedDoc[i], fieldDoc);
     }
   }
 

diff --git a/iceberg/iceberg-handler/src/test/results/positive/alter_multi_part_table_to_iceberg.q.out b/iceberg/iceberg-handler/src/test/results/positive/alter_multi_part_table_to_iceberg.q.out
@@ -177,8 +177,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_orc
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	string              	                    
-c                   	string              	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             
@@ -453,8 +451,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_parquet
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	string              	                    
-c                   	string              	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             
@@ -729,8 +725,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_avro
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	string              	                    
-c                   	string              	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             
@@ -1066,9 +1060,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_orc_mixed
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	double              	                    
-c                   	int                 	                    
-d                   	string              	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             
@@ -1513,9 +1504,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_parquet_mixed
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	double              	                    
-c                   	int                 	                    
-d                   	string              	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             
@@ -1960,9 +1948,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_avro_mixed
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	double              	                    
-c                   	int                 	                    
-d                   	string              	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             

diff --git a/iceberg/iceberg-handler/src/test/results/positive/alter_part_table_to_iceberg.q.out b/iceberg/iceberg-handler/src/test/results/positive/alter_part_table_to_iceberg.q.out
@@ -137,7 +137,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_orc
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	string              	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             
@@ -415,7 +414,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_parquet
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	string              	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             
@@ -770,7 +768,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_parquet_int
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	int                 	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             
@@ -1125,7 +1122,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_parquet_double
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	double              	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             
@@ -1426,7 +1422,6 @@ POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_avro
 # col_name            	data_type           	comment             
 a                   	int                 	                    
-b                   	string              	                    
 
 # Partition Information	 	 
 # col_name            	data_type           	comment             

diff --git a/iceberg/iceberg-handler/src/test/results/positive/bucket_map_join_9.q.out b/iceberg/iceberg-handler/src/test/results/positive/bucket_map_join_9.q.out
@@ -34,21 +34,21 @@ Stage-0
     limit:-1
     Stage-1
       Map 1 vectorized
-      File Output Operator [FS_53]
-        Map Join Operator [MAPJOIN_52] (rows=2 width=530)
-          BucketMapJoin:true,Conds:SEL_51._col1, _col2=RS_49._col1, _col2(Inner),Output:["_col0","_col1","_col2","_col3","_col4","_col5"]
+      File Output Operator [FS_23]
+        Map Join Operator [MAPJOIN_22] (rows=2 width=530)
+          BucketMapJoin:true,Conds:SEL_21._col1, _col2=RS_19._col1, _col2(Inner),Output:["_col0","_col1","_col2","_col3","_col4","_col5"]
         <-Map 2 [CUSTOM_EDGE] vectorized
-          MULTICAST [RS_49]
+          MULTICAST [RS_19]
             PartitionCols:_col2, _col1
-            Select Operator [SEL_48] (rows=2 width=265)
+            Select Operator [SEL_18] (rows=2 width=265)
               Output:["_col0","_col1","_col2"]
-              Filter Operator [FIL_47] (rows=2 width=265)
+              Filter Operator [FIL_17] (rows=2 width=265)
                 predicate:(id is not null and part is not null)
                 TableScan [TS_3] (rows=2 width=265)
                   default@tbl,tbl2,Tbl:COMPLETE,Col:COMPLETE,Output:["foid","part","id"]
-        <-Select Operator [SEL_51] (rows=2 width=265)
+        <-Select Operator [SEL_21] (rows=2 width=265)
             Output:["_col0","_col1","_col2"]
-            Filter Operator [FIL_50] (rows=2 width=265)
+            Filter Operator [FIL_20] (rows=2 width=265)
               predicate:(id is not null and part is not null)
               TableScan [TS_0] (rows=2 width=265)
                 default@tbl,tbl,Tbl:COMPLETE,Col:COMPLETE,Grouping Num Buckets:100,Grouping Partition Columns:["id","part"],Output:["foid","part","id"]

diff --git a/iceberg/iceberg-handler/src/test/results/positive/col_stats.q.out b/iceberg/iceberg-handler/src/test/results/positive/col_stats.q.out
@@ -347,7 +347,7 @@ PREHOOK: Input: default@tbl_ice_puffin
 POSTHOOK: query: desc formatted tbl_ice_puffin C
 POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_ice_puffin
-col_name            	C                   
+col_name            	c                   
 data_type           	int                 
 min                 	52                  
 max                 	56                  
@@ -358,7 +358,7 @@ max_col_len
 num_trues           	                    
 num_falses          	                    
 bit_vector          	HL                  
-comment             	                    
+comment             	Transform: identity 
 COLUMN_STATS_ACCURATE	{\"BASIC_STATS\":\"true\",\"COLUMN_STATS\":{\"a\":\"true\",\"b\":\"true\",\"c\":\"true\"}}
 PREHOOK: query: EXPLAIN select count(*) from src_ice t1 join tbl_ice_puffin t2 on (t1.a = t2.a)
 PREHOOK: type: QUERY

diff --git a/iceberg/iceberg-handler/src/test/results/positive/ctas_iceberg_partitioned_orc.q.out b/iceberg/iceberg-handler/src/test/results/positive/ctas_iceberg_partitioned_orc.q.out
@@ -273,8 +273,6 @@ POSTHOOK: query: describe formatted tbl_ice
 POSTHOOK: type: DESCTABLE
 POSTHOOK: Input: default@tbl_ice
 # col_name            	data_type           	comment             
-a                   	int                 	                    
-b                   	string              	                    
 c                   	int                 	                    
 
 # Partition Information