From 60f6611e5ea07404fb000c94565b9186057ec302 Mon Sep 17 00:00:00 2001 From: tsreaper Date: Tue, 12 Nov 2024 22:21:54 +0800 Subject: [PATCH 001/157] [flink] Support updating row type to another row type in Flink (#4499) --- .../paimon/catalog/AbstractCatalog.java | 3 +- .../apache/paimon/schema/SchemaChange.java | 56 ++++---- .../apache/paimon/schema/SchemaManager.java | 22 ++-- .../paimon/schema/SchemaManagerTest.java | 20 +-- .../UpdatedDataFieldsProcessFunctionBase.java | 8 +- .../org/apache/paimon/flink/FlinkCatalog.java | 120 ++++++++++++++++-- .../paimon/flink/SchemaChangeITCase.java | 51 +++++++- .../org/apache/paimon/spark/SparkCatalog.java | 8 +- 8 files changed, 213 insertions(+), 75 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java b/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java index c2e4afe5d533e..a1cf941cda621 100644 --- a/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java +++ b/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java @@ -48,6 +48,7 @@ import java.io.IOException; import java.util.ArrayList; +import java.util.Arrays; import java.util.Collections; import java.util.HashMap; import java.util.HashSet; @@ -560,7 +561,7 @@ private void validateFieldNameCaseInsensitiveInSchemaChange(List c for (SchemaChange change : changes) { if (change instanceof SchemaChange.AddColumn) { SchemaChange.AddColumn addColumn = (SchemaChange.AddColumn) change; - fieldNames.addAll(addColumn.fieldNames()); + fieldNames.addAll(Arrays.asList(addColumn.fieldNames())); } else if (change instanceof SchemaChange.RenameColumn) { SchemaChange.RenameColumn rename = (SchemaChange.RenameColumn) change; fieldNames.add(rename.newName()); diff --git a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaChange.java b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaChange.java index 1c1d601bced8a..cefa3c6eb9e74 100644 --- a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaChange.java +++ b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaChange.java @@ -25,8 +25,6 @@ import java.io.Serializable; import java.util.Arrays; -import java.util.Collections; -import java.util.List; import java.util.Objects; /** @@ -54,46 +52,45 @@ static SchemaChange addColumn(String fieldName, DataType dataType) { } static SchemaChange addColumn(String fieldName, DataType dataType, String comment) { - return new AddColumn(Collections.singletonList(fieldName), dataType, comment, null); + return new AddColumn(new String[] {fieldName}, dataType, comment, null); } static SchemaChange addColumn(String fieldName, DataType dataType, String comment, Move move) { - return new AddColumn(Collections.singletonList(fieldName), dataType, comment, move); + return new AddColumn(new String[] {fieldName}, dataType, comment, move); } static SchemaChange addColumn( - List fieldNames, DataType dataType, String comment, Move move) { + String[] fieldNames, DataType dataType, String comment, Move move) { return new AddColumn(fieldNames, dataType, comment, move); } static SchemaChange renameColumn(String fieldName, String newName) { - return new RenameColumn(Collections.singletonList(fieldName), newName); + return new RenameColumn(new String[] {fieldName}, newName); } - static SchemaChange renameColumn(List fieldNames, String newName) { + static SchemaChange renameColumn(String[] fieldNames, String newName) { return new RenameColumn(fieldNames, newName); } static SchemaChange dropColumn(String fieldName) { - 
return new DropColumn(Collections.singletonList(fieldName)); + return new DropColumn(new String[] {fieldName}); } - static SchemaChange dropColumn(List fieldNames) { + static SchemaChange dropColumn(String[] fieldNames) { return new DropColumn(fieldNames); } static SchemaChange updateColumnType(String fieldName, DataType newDataType) { - return new UpdateColumnType(Collections.singletonList(fieldName), newDataType, false); + return new UpdateColumnType(new String[] {fieldName}, newDataType, false); } static SchemaChange updateColumnType( String fieldName, DataType newDataType, boolean keepNullability) { - return new UpdateColumnType( - Collections.singletonList(fieldName), newDataType, keepNullability); + return new UpdateColumnType(new String[] {fieldName}, newDataType, keepNullability); } static SchemaChange updateColumnType( - List fieldNames, DataType newDataType, boolean keepNullability) { + String[] fieldNames, DataType newDataType, boolean keepNullability) { return new UpdateColumnType(fieldNames, newDataType, keepNullability); } @@ -228,20 +225,19 @@ final class AddColumn implements SchemaChange { private static final long serialVersionUID = 1L; - private final List fieldNames; + private final String[] fieldNames; private final DataType dataType; private final String description; private final Move move; - private AddColumn( - List fieldNames, DataType dataType, String description, Move move) { + private AddColumn(String[] fieldNames, DataType dataType, String description, Move move) { this.fieldNames = fieldNames; this.dataType = dataType; this.description = description; this.move = move; } - public List fieldNames() { + public String[] fieldNames() { return fieldNames; } @@ -268,7 +264,7 @@ public boolean equals(Object o) { return false; } AddColumn addColumn = (AddColumn) o; - return Objects.equals(fieldNames, addColumn.fieldNames) + return Arrays.equals(fieldNames, addColumn.fieldNames) && dataType.equals(addColumn.dataType) && Objects.equals(description, addColumn.description) && move.equals(addColumn.move); @@ -288,15 +284,15 @@ final class RenameColumn implements SchemaChange { private static final long serialVersionUID = 1L; - private final List fieldNames; + private final String[] fieldNames; private final String newName; - private RenameColumn(List fieldNames, String newName) { + private RenameColumn(String[] fieldNames, String newName) { this.fieldNames = fieldNames; this.newName = newName; } - public List fieldNames() { + public String[] fieldNames() { return fieldNames; } @@ -313,7 +309,7 @@ public boolean equals(Object o) { return false; } RenameColumn that = (RenameColumn) o; - return Objects.equals(fieldNames, that.fieldNames) + return Arrays.equals(fieldNames, that.fieldNames) && Objects.equals(newName, that.newName); } @@ -330,13 +326,13 @@ final class DropColumn implements SchemaChange { private static final long serialVersionUID = 1L; - private final List fieldNames; + private final String[] fieldNames; - private DropColumn(List fieldNames) { + private DropColumn(String[] fieldNames) { this.fieldNames = fieldNames; } - public List fieldNames() { + public String[] fieldNames() { return fieldNames; } @@ -349,7 +345,7 @@ public boolean equals(Object o) { return false; } DropColumn that = (DropColumn) o; - return Objects.equals(fieldNames, that.fieldNames); + return Arrays.equals(fieldNames, that.fieldNames); } @Override @@ -363,19 +359,19 @@ final class UpdateColumnType implements SchemaChange { private static final long serialVersionUID = 1L; - private final List 
fieldNames; + private final String[] fieldNames; private final DataType newDataType; // If true, do not change the target field nullability private final boolean keepNullability; private UpdateColumnType( - List fieldNames, DataType newDataType, boolean keepNullability) { + String[] fieldNames, DataType newDataType, boolean keepNullability) { this.fieldNames = fieldNames; this.newDataType = newDataType; this.keepNullability = keepNullability; } - public List fieldNames() { + public String[] fieldNames() { return fieldNames; } @@ -396,7 +392,7 @@ public boolean equals(Object o) { return false; } UpdateColumnType that = (UpdateColumnType) o; - return Objects.equals(fieldNames, that.fieldNames) + return Arrays.equals(fieldNames, that.fieldNames) && newDataType.equals(that.newDataType); } diff --git a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java index 86ed96d5b01ba..28cc69cf99d7b 100644 --- a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java +++ b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java @@ -290,7 +290,7 @@ public TableSchema commitChanges(List changes) DataType dataType = ReassignFieldId.reassign(addColumn.dataType(), highestFieldId); - new NestedColumnModifier(addColumn.fieldNames().toArray(new String[0])) { + new NestedColumnModifier(addColumn.fieldNames()) { @Override protected void updateLastColumn(List newFields, String fieldName) throws Catalog.ColumnAlreadyExistException { @@ -320,7 +320,7 @@ protected void updateLastColumn(List newFields, String fieldName) } else if (change instanceof RenameColumn) { RenameColumn rename = (RenameColumn) change; assertNotUpdatingPrimaryKeys(oldTableSchema, rename.fieldNames(), "rename"); - new NestedColumnModifier(rename.fieldNames().toArray(new String[0])) { + new NestedColumnModifier(rename.fieldNames()) { @Override protected void updateLastColumn(List newFields, String fieldName) throws Catalog.ColumnNotExistException, @@ -347,7 +347,7 @@ protected void updateLastColumn(List newFields, String fieldName) } else if (change instanceof DropColumn) { DropColumn drop = (DropColumn) change; dropColumnValidation(oldTableSchema, drop); - new NestedColumnModifier(drop.fieldNames().toArray(new String[0])) { + new NestedColumnModifier(drop.fieldNames()) { @Override protected void updateLastColumn(List newFields, String fieldName) throws Catalog.ColumnNotExistException { @@ -364,7 +364,7 @@ protected void updateLastColumn(List newFields, String fieldName) assertNotUpdatingPrimaryKeys(oldTableSchema, update.fieldNames(), "update"); updateNestedColumn( newFields, - update.fieldNames().toArray(new String[0]), + update.fieldNames(), (field) -> { DataType targetType = update.newDataType(); if (update.keepNullability()) { @@ -558,8 +558,8 @@ private static List applyNotNestedColumnRename( Map columnNames = Maps.newHashMap(); for (RenameColumn renameColumn : renames) { - if (renameColumn.fieldNames().size() == 1) { - columnNames.put(renameColumn.fieldNames().get(0), renameColumn.newName()); + if (renameColumn.fieldNames().length == 1) { + columnNames.put(renameColumn.fieldNames()[0], renameColumn.newName()); } } @@ -571,10 +571,10 @@ private static List applyNotNestedColumnRename( private static void dropColumnValidation(TableSchema schema, DropColumn change) { // primary keys and partition keys can't be nested columns - if (change.fieldNames().size() > 1) { + if (change.fieldNames().length > 1) { return; } - String 
columnToDrop = change.fieldNames().get(0); + String columnToDrop = change.fieldNames()[0]; if (schema.partitionKeys().contains(columnToDrop) || schema.primaryKeys().contains(columnToDrop)) { throw new UnsupportedOperationException( @@ -583,12 +583,12 @@ private static void dropColumnValidation(TableSchema schema, DropColumn change) } private static void assertNotUpdatingPrimaryKeys( - TableSchema schema, List fieldNames, String operation) { + TableSchema schema, String[] fieldNames, String operation) { // partition keys can't be nested columns - if (fieldNames.size() > 1) { + if (fieldNames.length > 1) { return; } - String columnToRename = fieldNames.get(0); + String columnToRename = fieldNames[0]; if (schema.partitionKeys().contains(columnToRename)) { throw new UnsupportedOperationException( String.format( diff --git a/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java b/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java index ac8d4cd91e1d8..088cb72f92e6c 100644 --- a/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java @@ -555,7 +555,7 @@ public void testAddAndDropNestedColumns() throws Exception { SchemaChange addColumn = SchemaChange.addColumn( - Arrays.asList("v", "f2", "f3"), + new String[] {"v", "f2", "f3"}, DataTypes.STRING(), "", SchemaChange.Move.after("f3", "f1")); @@ -579,11 +579,11 @@ public void testAddAndDropNestedColumns() throws Exception { .hasMessageContaining("Column v.f2.f3 already exists"); SchemaChange middleColumnNotExistAddColumn = SchemaChange.addColumn( - Arrays.asList("v", "invalid", "f4"), DataTypes.STRING(), "", null); + new String[] {"v", "invalid", "f4"}, DataTypes.STRING(), "", null); assertThatCode(() -> manager.commitChanges(middleColumnNotExistAddColumn)) .hasMessageContaining("Column v.invalid does not exist"); - SchemaChange dropColumn = SchemaChange.dropColumn(Arrays.asList("v", "f2", "f1")); + SchemaChange dropColumn = SchemaChange.dropColumn(new String[] {"v", "f2", "f1"}); manager.commitChanges(dropColumn); innerType = @@ -602,7 +602,7 @@ public void testAddAndDropNestedColumns() throws Exception { assertThatCode(() -> manager.commitChanges(dropColumn)) .hasMessageContaining("Column v.f2.f1 does not exist"); SchemaChange middleColumnNotExistDropColumn = - SchemaChange.dropColumn(Arrays.asList("v", "invalid", "f2")); + SchemaChange.dropColumn(new String[] {"v", "invalid", "f2"}); assertThatCode(() -> manager.commitChanges(middleColumnNotExistDropColumn)) .hasMessageContaining("Column v.invalid does not exist"); } @@ -632,7 +632,7 @@ public void testRenameNestedColumns() throws Exception { manager.createTable(schema); SchemaChange renameColumn = - SchemaChange.renameColumn(Arrays.asList("v", "f2", "f1"), "f100"); + SchemaChange.renameColumn(new String[] {"v", "f2", "f1"}, "f100"); manager.commitChanges(renameColumn); innerType = @@ -649,17 +649,17 @@ public void testRenameNestedColumns() throws Exception { assertThat(manager.latest().get().logicalRowType()).isEqualTo(outerType); SchemaChange middleColumnNotExistRenameColumn = - SchemaChange.renameColumn(Arrays.asList("v", "invalid", "f2"), "f200"); + SchemaChange.renameColumn(new String[] {"v", "invalid", "f2"}, "f200"); assertThatCode(() -> manager.commitChanges(middleColumnNotExistRenameColumn)) .hasMessageContaining("Column v.invalid does not exist"); SchemaChange lastColumnNotExistRenameColumn = - SchemaChange.renameColumn(Arrays.asList("v", "f2", 
"invalid"), "new_invalid"); + SchemaChange.renameColumn(new String[] {"v", "f2", "invalid"}, "new_invalid"); assertThatCode(() -> manager.commitChanges(lastColumnNotExistRenameColumn)) .hasMessageContaining("Column v.f2.invalid does not exist"); SchemaChange newNameAlreadyExistRenameColumn = - SchemaChange.renameColumn(Arrays.asList("v", "f2", "f2"), "f100"); + SchemaChange.renameColumn(new String[] {"v", "f2", "f2"}, "f100"); assertThatCode(() -> manager.commitChanges(newNameAlreadyExistRenameColumn)) .hasMessageContaining("Column v.f2.f100 already exists"); } @@ -690,7 +690,7 @@ public void testUpdateNestedColumnType() throws Exception { SchemaChange updateColumnType = SchemaChange.updateColumnType( - Arrays.asList("v", "f2", "f1"), DataTypes.BIGINT(), true); + new String[] {"v", "f2", "f1"}, DataTypes.BIGINT(), true); manager.commitChanges(updateColumnType); innerType = @@ -708,7 +708,7 @@ public void testUpdateNestedColumnType() throws Exception { SchemaChange middleColumnNotExistUpdateColumnType = SchemaChange.updateColumnType( - Arrays.asList("v", "invalid", "f1"), DataTypes.BIGINT(), true); + new String[] {"v", "invalid", "f1"}, DataTypes.BIGINT(), true); assertThatCode(() -> manager.commitChanges(middleColumnNotExistUpdateColumnType)) .hasMessageContaining("Column v.invalid does not exist"); } diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunctionBase.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunctionBase.java index 0e93fdb073244..c2e928bd4a0aa 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunctionBase.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunctionBase.java @@ -101,7 +101,7 @@ protected void applySchemaChange( SchemaChange.UpdateColumnType updateColumnType = (SchemaChange.UpdateColumnType) schemaChange; Preconditions.checkState( - updateColumnType.fieldNames().size() == 1, + updateColumnType.fieldNames().length == 1, "Paimon CDC currently does not support nested type schema evolution."); TableSchema schema = schemaManager @@ -110,11 +110,11 @@ protected void applySchemaChange( () -> new RuntimeException( "Table does not exist. This is unexpected.")); - int idx = schema.fieldNames().indexOf(updateColumnType.fieldNames().get(0)); + int idx = schema.fieldNames().indexOf(updateColumnType.fieldNames()[0]); Preconditions.checkState( idx >= 0, "Field name " - + updateColumnType.fieldNames().get(0) + + updateColumnType.fieldNames()[0] + " does not exist in table. 
This is unexpected."); DataType oldType = schema.fields().get(idx).type(); DataType newType = updateColumnType.newDataType(); @@ -126,7 +126,7 @@ protected void applySchemaChange( throw new UnsupportedOperationException( String.format( "Cannot convert field %s from type %s to %s of Paimon table %s.", - updateColumnType.fieldNames().get(0), + updateColumnType.fieldNames()[0], oldType, newType, identifier.getFullName())); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java index cae6e6f0e3672..ae30fa569d59e 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java @@ -37,6 +37,8 @@ import org.apache.paimon.table.Table; import org.apache.paimon.table.sink.BatchWriteBuilder; import org.apache.paimon.table.source.ReadBuilder; +import org.apache.paimon.types.DataField; +import org.apache.paimon.types.DataTypeRoot; import org.apache.paimon.utils.FileStorePathFactory; import org.apache.paimon.utils.InternalRowPartitionComputer; import org.apache.paimon.utils.Preconditions; @@ -98,7 +100,6 @@ import org.apache.flink.table.expressions.Expression; import org.apache.flink.table.factories.Factory; import org.apache.flink.table.procedures.Procedure; -import org.apache.flink.table.types.logical.LogicalType; import org.apache.flink.table.types.logical.RowType; import org.slf4j.Logger; import org.slf4j.LoggerFactory; @@ -110,11 +111,13 @@ import java.util.Arrays; import java.util.Collections; import java.util.HashMap; +import java.util.HashSet; import java.util.LinkedHashMap; import java.util.List; import java.util.Map; import java.util.Objects; import java.util.Optional; +import java.util.Set; import java.util.function.Function; import java.util.stream.Collectors; @@ -595,17 +598,12 @@ private List toSchemaChange( if (!oldTableNonPhysicalColumnIndex.containsKey( ((ModifyPhysicalColumnType) change).getOldColumn().getName())) { ModifyPhysicalColumnType modify = (ModifyPhysicalColumnType) change; - LogicalType newColumnType = modify.getNewType().getLogicalType(); - LogicalType oldColumnType = modify.getOldColumn().getDataType().getLogicalType(); - if (newColumnType.isNullable() != oldColumnType.isNullable()) { - schemaChanges.add( - SchemaChange.updateColumnNullability( - modify.getNewColumn().getName(), newColumnType.isNullable())); - } - schemaChanges.add( - SchemaChange.updateColumnType( - modify.getOldColumn().getName(), - LogicalTypeConversion.toDataType(newColumnType))); + generateNestedColumnUpdates( + Collections.singletonList(modify.getOldColumn().getName()), + LogicalTypeConversion.toDataType( + modify.getOldColumn().getDataType().getLogicalType()), + LogicalTypeConversion.toDataType(modify.getNewType().getLogicalType()), + schemaChanges); } return schemaChanges; } else if (change instanceof ModifyColumnPosition) { @@ -670,6 +668,104 @@ && handleMaterializedTableChange(change, schemaChanges)) { throw new UnsupportedOperationException("Change is not supported: " + change.getClass()); } + private void generateNestedColumnUpdates( + List fieldNames, + org.apache.paimon.types.DataType oldType, + org.apache.paimon.types.DataType newType, + List schemaChanges) { + if (oldType.getTypeRoot() == DataTypeRoot.ROW) { + Preconditions.checkArgument( + newType.getTypeRoot() == DataTypeRoot.ROW, + "Column " + + String.join(".", 
fieldNames) + + " can only be updated to row type, and cannot be updated to " + + newType + + " type"); + org.apache.paimon.types.RowType oldRowType = (org.apache.paimon.types.RowType) oldType; + org.apache.paimon.types.RowType newRowType = (org.apache.paimon.types.RowType) newType; + + // check that existing fields have same order + Map oldFieldOrders = new HashMap<>(); + for (int i = 0; i < oldRowType.getFieldCount(); i++) { + oldFieldOrders.put(oldRowType.getFields().get(i).name(), i); + } + int lastIdx = -1; + String lastFieldName = ""; + for (DataField newField : newRowType.getFields()) { + String name = newField.name(); + if (oldFieldOrders.containsKey(name)) { + int idx = oldFieldOrders.get(name); + Preconditions.checkState( + lastIdx < idx, + "Order of existing fields in column %s must be kept the same. " + + "However, field %s and %s have changed their orders.", + String.join(".", fieldNames), + lastFieldName, + name); + lastIdx = idx; + lastFieldName = name; + } + } + + // drop fields + Set newFieldNames = new HashSet<>(newRowType.getFieldNames()); + for (String name : oldRowType.getFieldNames()) { + if (!newFieldNames.contains(name)) { + List dropColumnNames = new ArrayList<>(fieldNames); + dropColumnNames.add(name); + schemaChanges.add( + SchemaChange.dropColumn(dropColumnNames.toArray(new String[0]))); + } + } + + for (int i = 0; i < newRowType.getFieldCount(); i++) { + DataField field = newRowType.getFields().get(i); + String name = field.name(); + List fullFieldNames = new ArrayList<>(fieldNames); + fullFieldNames.add(name); + if (!oldFieldOrders.containsKey(name)) { + // add fields + SchemaChange.Move move; + if (i == 0) { + move = SchemaChange.Move.first(name); + } else { + String lastName = newRowType.getFields().get(i - 1).name(); + move = SchemaChange.Move.after(name, lastName); + } + schemaChanges.add( + SchemaChange.addColumn( + fullFieldNames.toArray(new String[0]), + field.type(), + field.description(), + move)); + } else { + // update existing fields + DataField oldField = oldRowType.getFields().get(oldFieldOrders.get(name)); + if (!Objects.equals(oldField.description(), field.description())) { + schemaChanges.add( + SchemaChange.updateColumnComment( + fullFieldNames.toArray(new String[0]), + field.description())); + } + generateNestedColumnUpdates( + fullFieldNames, oldField.type(), field.type(), schemaChanges); + } + } + } else { + if (!oldType.equalsIgnoreNullable(newType)) { + schemaChanges.add( + SchemaChange.updateColumnType( + fieldNames.toArray(new String[0]), newType, false)); + } + } + + if (oldType.isNullable() != newType.isNullable()) { + schemaChanges.add( + SchemaChange.updateColumnNullability( + fieldNames.toArray(new String[0]), newType.isNullable())); + } + } + /** * Try handle change related to materialized table. 
* diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java index 08f79efccb763..ba161fe84008f 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java @@ -25,6 +25,8 @@ import org.apache.flink.table.api.config.ExecutionConfigOptions; import org.apache.flink.types.Row; import org.junit.jupiter.api.Test; +import org.junit.jupiter.params.ParameterizedTest; +import org.junit.jupiter.params.provider.ValueSource; import java.time.format.DateTimeFormatter; import java.util.List; @@ -35,6 +37,7 @@ import static org.apache.paimon.testutils.assertj.PaimonAssertions.anyCauseMatches; import static org.assertj.core.api.Assertions.assertThat; +import static org.assertj.core.api.Assertions.assertThatCode; import static org.assertj.core.api.Assertions.assertThatThrownBy; /** ITCase for schema changes. */ @@ -1015,7 +1018,6 @@ public void testSequenceFieldSortOrder() { sql("INSERT INTO T1 VALUES ('a', 'b', 'l')"); sql("INSERT INTO T1 VALUES ('a', 'd', 'n')"); sql("INSERT INTO T1 VALUES ('a', 'e', 'm')"); - List sql = sql("select * from T1"); assertThat(sql("select * from T1").toString()).isEqualTo("[+I[a, d, n]]"); // test for get small record @@ -1024,7 +1026,6 @@ public void testSequenceFieldSortOrder() { sql("INSERT INTO T2 VALUES ('a', 'b', 1)"); sql("INSERT INTO T2 VALUES ('a', 'd', 3)"); sql("INSERT INTO T2 VALUES ('a', 'e', 2)"); - sql = sql("select * from T2"); assertThat(sql("select * from T2").toString()).isEqualTo("[+I[a, b, 1]]"); // test for get largest record @@ -1033,7 +1034,6 @@ public void testSequenceFieldSortOrder() { sql("INSERT INTO T3 VALUES ('a', 'b', 1.0)"); sql("INSERT INTO T3 VALUES ('a', 'd', 3.0)"); sql("INSERT INTO T3 VALUES ('a', 'e', 2.0)"); - sql = sql("select * from T3"); assertThat(sql("select * from T3").toString()).isEqualTo("[+I[a, d, 3.0]]"); } @@ -1089,4 +1089,49 @@ public void testAlterBucket() { UnsupportedOperationException.class, "Cannot change bucket to -1.")); } + + @ParameterizedTest() + @ValueSource(strings = {"orc", "avro", "parquet"}) + public void testUpdateNestedColumn(String formatType) { + sql( + "CREATE TABLE T " + + "( k INT, v ROW(f1 INT, f2 ROW(f1 STRING, f2 INT NOT NULL)), PRIMARY KEY (k) NOT ENFORCED ) " + + "WITH ( 'bucket' = '1', 'file.format' = '" + + formatType + + "' )"); + sql( + "INSERT INTO T VALUES (1, ROW(10, ROW('apple', 100))), (2, ROW(20, ROW('banana', 200)))"); + assertThat(sql("SELECT * FROM T")) + .containsExactlyInAnyOrder( + Row.of(1, Row.of(10, Row.of("apple", 100))), + Row.of(2, Row.of(20, Row.of("banana", 200)))); + + sql("ALTER TABLE T MODIFY (v ROW(f1 BIGINT, f2 ROW(f3 DOUBLE, f2 INT), f3 STRING))"); + sql( + "INSERT INTO T VALUES " + + "(1, ROW(1000000000001, ROW(101.0, 101), 'cat')), " + + "(3, ROW(3000000000001, ROW(301.0, CAST(NULL AS INT)), 'dog'))"); + assertThat(sql("SELECT * FROM T")) + .containsExactlyInAnyOrder( + Row.of(1, Row.of(1000000000001L, Row.of(101.0, 101), "cat")), + Row.of(2, Row.of(20L, Row.of(null, 200), null)), + Row.of(3, Row.of(3000000000001L, Row.of(301.0, null), "dog"))); + + sql( + "ALTER TABLE T MODIFY (v ROW(f1 BIGINT, f2 ROW(f3 DOUBLE, f1 STRING, f2 INT), f3 STRING))"); + sql( + "INSERT INTO T VALUES " + + "(1, ROW(1000000000002, ROW(102.0, 'APPLE', 102), 'cat')), " + + "(4, ROW(4000000000002, 
ROW(402.0, 'LEMON', 402), 'tiger'))"); + assertThat(sql("SELECT k, v.f2.f1, v.f3 FROM T")) + .containsExactlyInAnyOrder( + Row.of(1, "APPLE", "cat"), + Row.of(2, null, null), + Row.of(3, null, "dog"), + Row.of(4, "LEMON", "tiger")); + + assertThatCode(() -> sql("ALTER TABLE T MODIFY (v ROW(f1 BIGINT, f2 INT, f3 STRING))")) + .hasRootCauseMessage( + "Column v.f2 can only be updated to row type, and cannot be updated to INT type"); + } } diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java index 5fde2c56596f6..89448c1f4310a 100644 --- a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java @@ -373,20 +373,20 @@ private SchemaChange toSchemaChange(TableChange change) { TableChange.AddColumn add = (TableChange.AddColumn) change; SchemaChange.Move move = getMove(add.position(), add.fieldNames()); return SchemaChange.addColumn( - Arrays.asList(add.fieldNames()), + add.fieldNames(), toPaimonType(add.dataType()).copy(add.isNullable()), add.comment(), move); } else if (change instanceof TableChange.RenameColumn) { TableChange.RenameColumn rename = (TableChange.RenameColumn) change; - return SchemaChange.renameColumn(Arrays.asList(rename.fieldNames()), rename.newName()); + return SchemaChange.renameColumn(rename.fieldNames(), rename.newName()); } else if (change instanceof TableChange.DeleteColumn) { TableChange.DeleteColumn delete = (TableChange.DeleteColumn) change; - return SchemaChange.dropColumn(Arrays.asList(delete.fieldNames())); + return SchemaChange.dropColumn(delete.fieldNames()); } else if (change instanceof TableChange.UpdateColumnType) { TableChange.UpdateColumnType update = (TableChange.UpdateColumnType) change; return SchemaChange.updateColumnType( - Arrays.asList(update.fieldNames()), toPaimonType(update.newDataType()), true); + update.fieldNames(), toPaimonType(update.newDataType()), true); } else if (change instanceof TableChange.UpdateColumnNullability) { TableChange.UpdateColumnNullability update = (TableChange.UpdateColumnNullability) change; From 4d32ed8b558d13ead30df74efe1941704c822bd8 Mon Sep 17 00:00:00 2001 From: wangwj Date: Tue, 12 Nov 2024 22:23:44 +0800 Subject: [PATCH 002/157] [core] FilesTable file_path col should be the path instead of name (#4503) --- .../org/apache/paimon/table/system/FilesTable.java | 4 +++- .../apache/paimon/table/system/FilesTableTest.java | 11 ++++++++++- 2 files changed, 13 insertions(+), 2 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/FilesTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/FilesTable.java index 53d2078126737..0232fc2d2ddee 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/FilesTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/FilesTable.java @@ -385,7 +385,9 @@ private LazyGenericRow toRow( partitionConverter.convert( dataSplit.partition()))), dataSplit::bucket, - () -> BinaryString.fromString(dataFileMeta.fileName()), + () -> + BinaryString.fromString( + dataSplit.bucketPath() + "/" + dataFileMeta.fileName()), () -> BinaryString.fromString( DataFilePathFactory.formatIdentifier( diff --git a/paimon-core/src/test/java/org/apache/paimon/table/system/FilesTableTest.java b/paimon-core/src/test/java/org/apache/paimon/table/system/FilesTableTest.java index 
1a692270ac5be..f0280560c2675 100644 --- a/paimon-core/src/test/java/org/apache/paimon/table/system/FilesTableTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/table/system/FilesTableTest.java @@ -191,7 +191,16 @@ private List getExpectedResult(long snapshotId) { BinaryString.fromString( Arrays.toString(new String[] {partition1, partition2})), fileEntry.bucket(), - BinaryString.fromString(file.fileName()), + BinaryString.fromString( + table.location() + + "/pt1=" + + partition1 + + "/pt2=" + + partition2 + + "/bucket-" + + fileEntry.bucket() + + "/" + + file.fileName()), BinaryString.fromString(file.fileFormat()), file.schemaId(), file.level(), From c3a83195f40ea33f07a447d4d39f98890e4a4334 Mon Sep 17 00:00:00 2001 From: Kerwin <37063904+zhuangchong@users.noreply.github.com> Date: Tue, 12 Nov 2024 22:24:19 +0800 Subject: [PATCH 003/157] [doc] fix flink procedure document sql syntax error. (#4504) --- docs/content/flink/procedures.md | 2 +- docs/content/maintenance/manage-snapshots.md | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/docs/content/flink/procedures.md b/docs/content/flink/procedures.md index d55a8daddef66..7e669a89d43bf 100644 --- a/docs/content/flink/procedures.md +++ b/docs/content/flink/procedures.md @@ -409,7 +409,7 @@ All available procedures are listed below. expire_snapshots -- Use named argument
-        CALL [catalog.]sys.reset_consumer(<br/>
+        CALL [catalog.]sys.expire_snapshots(<br/>
            `table` => 'identifier',<br/>
            retain_max => 'retain_max',<br/>
            retain_min => 'retain_min',<br/>
diff --git a/docs/content/maintenance/manage-snapshots.md b/docs/content/maintenance/manage-snapshots.md index eed0f72c08c2c..721d5d0bafb28 100644 --- a/docs/content/maintenance/manage-snapshots.md +++ b/docs/content/maintenance/manage-snapshots.md @@ -308,9 +308,9 @@ submit a `remove_orphan_files` job to clean them: {{< tab "Spark SQL/Flink SQL" >}} ```sql -CALL sys.remove_orphan_files(`table` => "my_db.my_table", [older_than => "2023-10-31 12:00:00"]) +CALL sys.remove_orphan_files(`table` => 'my_db.my_table', [older_than => '2023-10-31 12:00:00']) -CALL sys.remove_orphan_files(`table` => "my_db.*", [older_than => "2023-10-31 12:00:00"]) +CALL sys.remove_orphan_files(`table` => 'my_db.*', [older_than => '2023-10-31 12:00:00']) ``` {{< /tab >}} From 3ffeab94956882862802c2abfa73915e1789fe86 Mon Sep 17 00:00:00 2001 From: askwang <135721692+askwang@users.noreply.github.com> Date: Wed, 13 Nov 2024 10:59:08 +0800 Subject: [PATCH 004/157] [doc] Remove unused config in record-level expire (#4509) --- docs/content/primary-key-table/compaction.md | 1 - 1 file changed, 1 deletion(-) diff --git a/docs/content/primary-key-table/compaction.md b/docs/content/primary-key-table/compaction.md index ada7e0289b359..bee8c16e46e9d 100644 --- a/docs/content/primary-key-table/compaction.md +++ b/docs/content/primary-key-table/compaction.md @@ -76,7 +76,6 @@ In compaction, you can configure record-Level expire time to expire records, you 1. `'record-level.expire-time'`: time retain for records. 2. `'record-level.time-field'`: time field for record level expire. -3. `'record-level.time-field-type'`: time field type for record level expire, it can be seconds-int,seconds-long or millis-long. Expiration happens in compaction, and there is no strong guarantee to expire records in time. From 5e3c24b89876eaa7d5a4d7783ac01b64a939fae7 Mon Sep 17 00:00:00 2001 From: askwang <135721692+askwang@users.noreply.github.com> Date: Wed, 13 Nov 2024 11:19:56 +0800 Subject: [PATCH 005/157] [core] Adjust default value of 'snapshot.expire.limit' (#4508) --- docs/layouts/shortcodes/generated/core_configuration.html | 2 +- paimon-common/src/main/java/org/apache/paimon/CoreOptions.java | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/layouts/shortcodes/generated/core_configuration.html b/docs/layouts/shortcodes/generated/core_configuration.html index 1305dfe9263b6..7287cacc2c53e 100644 --- a/docs/layouts/shortcodes/generated/core_configuration.html +++ b/docs/layouts/shortcodes/generated/core_configuration.html @@ -751,7 +751,7 @@
snapshot.expire.limit
- 10 + 50 Integer The maximum number of snapshots allowed to expire at a time. diff --git a/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java b/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java index bb1661d6fd829..db603c5b61f06 100644 --- a/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java +++ b/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java @@ -315,7 +315,7 @@ public class CoreOptions implements Serializable { public static final ConfigOption SNAPSHOT_EXPIRE_LIMIT = key("snapshot.expire.limit") .intType() - .defaultValue(10) + .defaultValue(50) .withDescription( "The maximum number of snapshots allowed to expire at a time."); From 72c25d58c575d4966fd2cb12fcc883071e393890 Mon Sep 17 00:00:00 2001 From: Jingsong Lee Date: Wed, 13 Nov 2024 11:27:07 +0800 Subject: [PATCH 006/157] [core] Add Table.uuid method (#4213) --- .../paimon/catalog/AbstractCatalog.java | 32 +++++++++++++++++-- .../apache/paimon/schema/SchemaManager.java | 19 +++++++++++ .../paimon/table/AbstractFileStoreTable.java | 9 ++++++ .../paimon/table/CatalogEnvironment.java | 10 +++++- .../paimon/table/DelegatedFileStoreTable.java | 5 +++ .../java/org/apache/paimon/table/Table.java | 9 ++++++ .../paimon/catalog/CatalogTestBase.java | 12 +++++++ .../org/apache/paimon/hive/HiveCatalog.java | 19 +++++++++-- 8 files changed, 108 insertions(+), 7 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java b/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java index a1cf941cda621..93018f12c9f1b 100644 --- a/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java +++ b/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java @@ -424,16 +424,17 @@ public Table getTable(Identifier identifier) throws TableNotExistException { protected Table getDataOrFormatTable(Identifier identifier) throws TableNotExistException { Preconditions.checkArgument(identifier.getSystemTableName() == null); - TableSchema tableSchema = getDataTableSchema(identifier); + TableMeta tableMeta = getDataTableMeta(identifier); return FileStoreTableFactory.create( fileIO, getTableLocation(identifier), - tableSchema, + tableMeta.schema, new CatalogEnvironment( identifier, + tableMeta.uuid, Lock.factory( lockFactory().orElse(null), lockContext().orElse(null), identifier), - metastoreClientFactory(identifier, tableSchema).orElse(null), + metastoreClientFactory(identifier, tableMeta.schema).orElse(null), lineageMetaFactory)); } @@ -475,6 +476,10 @@ public Map> allTablePaths() { } } + protected TableMeta getDataTableMeta(Identifier identifier) throws TableNotExistException { + return new TableMeta(getDataTableSchema(identifier), null); + } + protected abstract TableSchema getDataTableSchema(Identifier identifier) throws TableNotExistException; @@ -627,4 +632,25 @@ public Optional tableSchemaInFileSystem(Path tablePath, String bran } }); } + + /** Table metadata. 
*/ + protected static class TableMeta { + + private final TableSchema schema; + @Nullable private final String uuid; + + public TableMeta(TableSchema schema, @Nullable String uuid) { + this.schema = schema; + this.uuid = uuid; + } + + public TableSchema schema() { + return schema; + } + + @Nullable + public String uuid() { + return uuid; + } + } } diff --git a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java index 28cc69cf99d7b..86e365a88f831 100644 --- a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java +++ b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java @@ -78,6 +78,7 @@ import static org.apache.paimon.catalog.Identifier.UNKNOWN_DATABASE; import static org.apache.paimon.utils.BranchManager.DEFAULT_MAIN_BRANCH; import static org.apache.paimon.utils.FileUtils.listVersionedFiles; +import static org.apache.paimon.utils.Preconditions.checkArgument; import static org.apache.paimon.utils.Preconditions.checkState; /** Schema Manager to manage schema versions. */ @@ -123,6 +124,24 @@ public Optional latest() { } } + public long earliestCreationTime() { + try { + long earliest = 0; + if (!schemaExists(0)) { + Optional min = + listVersionedFiles(fileIO, schemaDirectory(), SCHEMA_PREFIX) + .reduce(Math::min); + checkArgument(min.isPresent()); + earliest = min.get(); + } + + Path schemaPath = toSchemaPath(earliest); + return fileIO.getFileStatus(schemaPath).getModificationTime(); + } catch (IOException e) { + throw new UncheckedIOException(e); + } + } + public List listAll() { return listAllIds().stream().map(this::schema).collect(Collectors.toList()); } diff --git a/paimon-core/src/main/java/org/apache/paimon/table/AbstractFileStoreTable.java b/paimon-core/src/main/java/org/apache/paimon/table/AbstractFileStoreTable.java index af0c3d71ec1ca..07c0e88645ac3 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/AbstractFileStoreTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/AbstractFileStoreTable.java @@ -167,6 +167,15 @@ public Identifier identifier() { : identifier; } + @Override + public String uuid() { + if (catalogEnvironment.uuid() != null) { + return catalogEnvironment.uuid(); + } + long earliestCreationTime = schemaManager().earliestCreationTime(); + return fullName() + "." 
+ earliestCreationTime; + } + @Override public Optional statistics() { Snapshot snapshot = TimeTravelUtil.resolveSnapshot(this); diff --git a/paimon-core/src/main/java/org/apache/paimon/table/CatalogEnvironment.java b/paimon-core/src/main/java/org/apache/paimon/table/CatalogEnvironment.java index ebaff12661556..9ff5f9b4f6a83 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/CatalogEnvironment.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/CatalogEnvironment.java @@ -36,23 +36,26 @@ public class CatalogEnvironment implements Serializable { private static final long serialVersionUID = 1L; @Nullable private final Identifier identifier; + @Nullable private final String uuid; private final Lock.Factory lockFactory; @Nullable private final MetastoreClient.Factory metastoreClientFactory; @Nullable private final LineageMetaFactory lineageMetaFactory; public CatalogEnvironment( @Nullable Identifier identifier, + @Nullable String uuid, Lock.Factory lockFactory, @Nullable MetastoreClient.Factory metastoreClientFactory, @Nullable LineageMetaFactory lineageMetaFactory) { this.identifier = identifier; + this.uuid = uuid; this.lockFactory = lockFactory; this.metastoreClientFactory = metastoreClientFactory; this.lineageMetaFactory = lineageMetaFactory; } public static CatalogEnvironment empty() { - return new CatalogEnvironment(null, Lock.emptyFactory(), null, null); + return new CatalogEnvironment(null, null, Lock.emptyFactory(), null, null); } @Nullable @@ -60,6 +63,11 @@ public Identifier identifier() { return identifier; } + @Nullable + public String uuid() { + return uuid; + } + public Lock.Factory lockFactory() { return lockFactory; } diff --git a/paimon-core/src/main/java/org/apache/paimon/table/DelegatedFileStoreTable.java b/paimon-core/src/main/java/org/apache/paimon/table/DelegatedFileStoreTable.java index f6f3930baade8..2b369e5005cc4 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/DelegatedFileStoreTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/DelegatedFileStoreTable.java @@ -72,6 +72,11 @@ public String fullName() { return wrapped.fullName(); } + @Override + public String uuid() { + return wrapped.uuid(); + } + @Override public SnapshotReader newSnapshotReader() { return wrapped.newSnapshotReader(); diff --git a/paimon-core/src/main/java/org/apache/paimon/table/Table.java b/paimon-core/src/main/java/org/apache/paimon/table/Table.java index db6848f5f1a84..7ed7ba48a8ebd 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/Table.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/Table.java @@ -52,10 +52,19 @@ public interface Table extends Serializable { /** A name to identify this table. */ String name(); + /** Full name of the table, default is database.tableName. */ default String fullName() { return name(); } + /** + * UUID of the table, metastore can provide the true UUID of this table, default is the full + * name. + */ + default String uuid() { + return fullName(); + } + /** Returns the row type of this table. 
*/ RowType rowType(); diff --git a/paimon-core/src/test/java/org/apache/paimon/catalog/CatalogTestBase.java b/paimon-core/src/test/java/org/apache/paimon/catalog/CatalogTestBase.java index f130920a7c0e4..98a9b92c5c38c 100644 --- a/paimon-core/src/test/java/org/apache/paimon/catalog/CatalogTestBase.java +++ b/paimon-core/src/test/java/org/apache/paimon/catalog/CatalogTestBase.java @@ -948,4 +948,16 @@ public void testFormatTable() throws Exception { .isInstanceOf(Catalog.TableNotExistException.class); assertThat(catalog.getTable(newIdentifier)).isInstanceOf(FormatTable.class); } + + @Test + public void testTableUUID() throws Exception { + catalog.createDatabase("test_db", false); + Identifier identifier = Identifier.create("test_db", "test_table"); + catalog.createTable(identifier, DEFAULT_TABLE_SCHEMA, false); + Table table = catalog.getTable(identifier); + String uuid = table.uuid(); + assertThat(uuid).startsWith(identifier.getFullName() + "."); + assertThat(Long.parseLong(uuid.substring((identifier.getFullName() + ".").length()))) + .isGreaterThan(0); + } } diff --git a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java index 2bf16c0f44b1d..8b8b62934dbdb 100644 --- a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java +++ b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java @@ -411,6 +411,18 @@ protected List listTablesImpl(String databaseName) { } } + @Override + protected TableMeta getDataTableMeta(Identifier identifier) throws TableNotExistException { + return getDataTableMeta(identifier, getHmsTable(identifier)); + } + + private TableMeta getDataTableMeta(Identifier identifier, Table table) + throws TableNotExistException { + return new TableMeta( + getDataTableSchema(identifier, table), + identifier.getFullName() + "." 
+ table.getCreateTime()); + } + @Override public TableSchema getDataTableSchema(Identifier identifier) throws TableNotExistException { Table table = getHmsTable(identifier); @@ -567,18 +579,19 @@ public org.apache.paimon.table.Table getDataOrFormatTable(Identifier identifier) Preconditions.checkArgument(identifier.getSystemTableName() == null); Table table = getHmsTable(identifier); try { - TableSchema tableSchema = getDataTableSchema(identifier, table); + TableMeta tableMeta = getDataTableMeta(identifier, table); return FileStoreTableFactory.create( fileIO, getTableLocation(identifier, table), - tableSchema, + tableMeta.schema(), new CatalogEnvironment( identifier, + tableMeta.uuid(), Lock.factory( lockFactory().orElse(null), lockContext().orElse(null), identifier), - metastoreClientFactory(identifier, tableSchema).orElse(null), + metastoreClientFactory(identifier, tableMeta.schema()).orElse(null), lineageMetaFactory)); } catch (TableNotExistException ignore) { } From 787a981cc2c009075d8c2aa5f3e2c66d5988aeeb Mon Sep 17 00:00:00 2001 From: Jingsong Date: Wed, 13 Nov 2024 11:32:13 +0800 Subject: [PATCH 007/157] [flink] Improve Exception message for consumer without expire time --- .../org/apache/paimon/flink/source/FlinkSourceBuilder.java | 4 +++- .../java/org/apache/paimon/flink/CatalogTableITCase.java | 6 ++++-- 2 files changed, 7 insertions(+), 3 deletions(-) diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkSourceBuilder.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkSourceBuilder.java index ed94043c035d8..a648bfba607d4 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkSourceBuilder.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkSourceBuilder.java @@ -259,7 +259,9 @@ public DataStream build() { if (conf.contains(CoreOptions.CONSUMER_ID) && !conf.contains(CoreOptions.CONSUMER_EXPIRATION_TIME)) { throw new IllegalArgumentException( - "consumer.expiration-time should be specified when using consumer-id."); + "You need to configure 'consumer.expiration-time' (ALTER TABLE) and restart your write job for it" + + " to take effect, when you need consumer-id feature. 
This is to prevent consumers from leaving" + + " too many snapshots that could pose a risk to the file system."); } if (sourceBounded) { diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java index ba063248ee460..8a3e068a72a02 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java @@ -972,7 +972,8 @@ public void testConsumerIdExpInBatchMode() { "SELECT * FROM T /*+ OPTIONS('consumer-id' = 'test-id') */ WHERE a = 1")) .rootCause() .isInstanceOf(IllegalArgumentException.class) - .hasMessage("consumer.expiration-time should be specified when using consumer-id."); + .hasMessageContaining( + "You need to configure 'consumer.expiration-time' (ALTER TABLE) and restart your write job for it"); } @Test @@ -985,7 +986,8 @@ public void testConsumerIdExpInStreamingMode() { streamSqlIter( "SELECT * FROM T /*+ OPTIONS('consumer-id'='test-id') */")) .isInstanceOf(IllegalArgumentException.class) - .hasMessage("consumer.expiration-time should be specified when using consumer-id."); + .hasMessageContaining( + "You need to configure 'consumer.expiration-time' (ALTER TABLE) and restart your write job for it"); } @Test From 2b94a33bc1dc841476b8970d9a0bb69a7e85502e Mon Sep 17 00:00:00 2001 From: Tan-JiaLiang Date: Wed, 13 Nov 2024 13:22:33 +0800 Subject: [PATCH 008/157] [core] Introduce bitmap index record reader (#4502) --- .../ApplyBitmapIndexFileRecordIterator.java | 78 +++++++++++++++++ .../bitmap/ApplyBitmapIndexRecordReader.java | 64 ++++++++++++++ .../apache/paimon/utils/RoaringBitmap32.java | 4 + .../ApplyDeletionVectorReader.java | 2 +- .../apache/paimon/io/FileIndexEvaluator.java | 9 ++ .../paimon/operation/RawFileSplitRead.java | 10 ++- .../table/AppendOnlyFileStoreTableTest.java | 11 +++ .../table/PrimaryKeyFileStoreTableTest.java | 87 +++++++++++++++++++ 8 files changed, 263 insertions(+), 2 deletions(-) create mode 100644 paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexFileRecordIterator.java create mode 100644 paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexRecordReader.java diff --git a/paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexFileRecordIterator.java b/paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexFileRecordIterator.java new file mode 100644 index 0000000000000..eec931d3e98f8 --- /dev/null +++ b/paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexFileRecordIterator.java @@ -0,0 +1,78 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+ * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.fileindex.bitmap; + +import org.apache.paimon.data.InternalRow; +import org.apache.paimon.fs.Path; +import org.apache.paimon.reader.FileRecordIterator; +import org.apache.paimon.utils.RoaringBitmap32; + +import javax.annotation.Nullable; + +import java.io.IOException; + +/** + * A {@link FileRecordIterator} wraps a {@link FileRecordIterator} and {@link BitmapIndexResult}. + */ +public class ApplyBitmapIndexFileRecordIterator implements FileRecordIterator { + + private final FileRecordIterator iterator; + private final RoaringBitmap32 bitmap; + private final int last; + + public ApplyBitmapIndexFileRecordIterator( + FileRecordIterator iterator, BitmapIndexResult fileIndexResult) { + this.iterator = iterator; + this.bitmap = fileIndexResult.get(); + this.last = bitmap.last(); + } + + @Override + public long returnedPosition() { + return iterator.returnedPosition(); + } + + @Override + public Path filePath() { + return iterator.filePath(); + } + + @Nullable + @Override + public InternalRow next() throws IOException { + while (true) { + InternalRow next = iterator.next(); + if (next == null) { + return null; + } + int position = (int) returnedPosition(); + if (position > last) { + return null; + } + if (bitmap.contains(position)) { + return next; + } + } + } + + @Override + public void releaseBatch() { + iterator.releaseBatch(); + } +} diff --git a/paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexRecordReader.java b/paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexRecordReader.java new file mode 100644 index 0000000000000..d5d15095f2eda --- /dev/null +++ b/paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexRecordReader.java @@ -0,0 +1,64 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.fileindex.bitmap; + +import org.apache.paimon.data.InternalRow; +import org.apache.paimon.reader.FileRecordIterator; +import org.apache.paimon.reader.RecordReader; + +import javax.annotation.Nullable; + +import java.io.IOException; + +import static org.apache.paimon.utils.Preconditions.checkArgument; + +/** A {@link RecordReader} which apply {@link BitmapIndexResult} to filter record. 
*/ +public class ApplyBitmapIndexRecordReader implements RecordReader { + + private final RecordReader reader; + + private final BitmapIndexResult fileIndexResult; + + public ApplyBitmapIndexRecordReader( + RecordReader reader, BitmapIndexResult fileIndexResult) { + this.reader = reader; + this.fileIndexResult = fileIndexResult; + } + + @Nullable + @Override + public RecordIterator readBatch() throws IOException { + RecordIterator batch = reader.readBatch(); + if (batch == null) { + return null; + } + + checkArgument( + batch instanceof FileRecordIterator, + "There is a bug, RecordIterator in ApplyBitmapIndexRecordReader must be FileRecordIterator"); + + return new ApplyBitmapIndexFileRecordIterator( + (FileRecordIterator) batch, fileIndexResult); + } + + @Override + public void close() throws IOException { + reader.close(); + } +} diff --git a/paimon-common/src/main/java/org/apache/paimon/utils/RoaringBitmap32.java b/paimon-common/src/main/java/org/apache/paimon/utils/RoaringBitmap32.java index 1d3468a9fcdb3..5f352f61cd3c6 100644 --- a/paimon-common/src/main/java/org/apache/paimon/utils/RoaringBitmap32.java +++ b/paimon-common/src/main/java/org/apache/paimon/utils/RoaringBitmap32.java @@ -72,6 +72,10 @@ public long rangeCardinality(long start, long end) { return roaringBitmap.rangeCardinality(start, end); } + public int last() { + return roaringBitmap.last(); + } + public RoaringBitmap32 clone() { return new RoaringBitmap32(roaringBitmap.clone()); } diff --git a/paimon-core/src/main/java/org/apache/paimon/deletionvectors/ApplyDeletionVectorReader.java b/paimon-core/src/main/java/org/apache/paimon/deletionvectors/ApplyDeletionVectorReader.java index 18ab033fb2762..c1dc16a78d950 100644 --- a/paimon-core/src/main/java/org/apache/paimon/deletionvectors/ApplyDeletionVectorReader.java +++ b/paimon-core/src/main/java/org/apache/paimon/deletionvectors/ApplyDeletionVectorReader.java @@ -60,7 +60,7 @@ public RecordIterator readBatch() throws IOException { checkArgument( batch instanceof FileRecordIterator, - "There is a bug, RecordIterator in ApplyDeletionVectorReader must be RecordWithPositionIterator"); + "There is a bug, RecordIterator in ApplyDeletionVectorReader must be FileRecordIterator"); return new ApplyDeletionFileRecordIterator( (FileRecordIterator) batch, deletionVector); diff --git a/paimon-core/src/main/java/org/apache/paimon/io/FileIndexEvaluator.java b/paimon-core/src/main/java/org/apache/paimon/io/FileIndexEvaluator.java index c34d1b0d3ba75..530b87165322f 100644 --- a/paimon-core/src/main/java/org/apache/paimon/io/FileIndexEvaluator.java +++ b/paimon-core/src/main/java/org/apache/paimon/io/FileIndexEvaluator.java @@ -40,6 +40,15 @@ public static FileIndexResult evaluate( DataFileMeta file) throws IOException { if (dataFilter != null && !dataFilter.isEmpty()) { + byte[] embeddedIndex = file.embeddedIndex(); + if (embeddedIndex != null) { + try (FileIndexPredicate predicate = + new FileIndexPredicate(embeddedIndex, dataSchema.logicalRowType())) { + return predicate.evaluate( + PredicateBuilder.and(dataFilter.toArray(new Predicate[0]))); + } + } + List indexFiles = file.extraFiles().stream() .filter(name -> name.endsWith(DataFilePathFactory.INDEX_PATH_SUFFIX)) diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/RawFileSplitRead.java b/paimon-core/src/main/java/org/apache/paimon/operation/RawFileSplitRead.java index 9c612a9f8cf06..4a6fa5b3db7f2 100644 --- a/paimon-core/src/main/java/org/apache/paimon/operation/RawFileSplitRead.java +++ 
b/paimon-core/src/main/java/org/apache/paimon/operation/RawFileSplitRead.java @@ -24,6 +24,8 @@ import org.apache.paimon.deletionvectors.DeletionVector; import org.apache.paimon.disk.IOManager; import org.apache.paimon.fileindex.FileIndexResult; +import org.apache.paimon.fileindex.bitmap.ApplyBitmapIndexRecordReader; +import org.apache.paimon.fileindex.bitmap.BitmapIndexResult; import org.apache.paimon.format.FileFormatDiscover; import org.apache.paimon.format.FormatKey; import org.apache.paimon.format.FormatReaderContext; @@ -212,7 +214,7 @@ private RecordReader createFileReader( dataFilePathFactory.toPath(file.fileName()), file.fileSize(), fileIndexResult); - FileRecordReader fileRecordReader = + RecordReader fileRecordReader = new FileRecordReader( bulkFormatMapping.getReaderFactory(), formatReaderContext, @@ -220,6 +222,12 @@ private RecordReader createFileReader( bulkFormatMapping.getCastMapping(), PartitionUtils.create(bulkFormatMapping.getPartitionPair(), partition)); + if (fileIndexResult instanceof BitmapIndexResult) { + fileRecordReader = + new ApplyBitmapIndexRecordReader( + fileRecordReader, (BitmapIndexResult) fileIndexResult); + } + DeletionVector deletionVector = dvFactory == null ? null : dvFactory.get(); if (deletionVector != null && !deletionVector.isEmpty()) { return new ApplyDeletionVectorReader(fileRecordReader, deletionVector); diff --git a/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java b/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java index 81dd30262058a..0328cc6bada34 100644 --- a/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java @@ -79,6 +79,7 @@ import static org.apache.paimon.CoreOptions.BUCKET; import static org.apache.paimon.CoreOptions.BUCKET_KEY; import static org.apache.paimon.CoreOptions.FILE_INDEX_IN_MANIFEST_THRESHOLD; +import static org.apache.paimon.CoreOptions.METADATA_STATS_MODE; import static org.apache.paimon.io.DataFileTestUtils.row; import static org.apache.paimon.table.sink.KeyAndBucketExtractor.bucket; import static org.apache.paimon.table.sink.KeyAndBucketExtractor.bucketKeyHashCode; @@ -574,6 +575,7 @@ public void testBSIAndBitmapIndexInMemory() throws Exception { createUnawareBucketFileStoreTable( rowType, options -> { + options.set(METADATA_STATS_MODE, "NONE"); options.set( FileIndexOptions.FILE_INDEX + "." @@ -600,7 +602,11 @@ public void testBSIAndBitmapIndexInMemory() throws Exception { write.write(GenericRow.of(1, BinaryString.fromString("B"), 3L)); write.write(GenericRow.of(1, BinaryString.fromString("C"), 3L)); result.addAll(write.prepareCommit(true, 0)); + write.write(GenericRow.of(1, BinaryString.fromString("A"), 4L)); + write.write(GenericRow.of(1, BinaryString.fromString("B"), 3L)); write.write(GenericRow.of(1, BinaryString.fromString("C"), 4L)); + write.write(GenericRow.of(1, BinaryString.fromString("D"), 2L)); + write.write(GenericRow.of(1, BinaryString.fromString("D"), 4L)); result.addAll(write.prepareCommit(true, 0)); commit.commit(0, result); result.clear(); @@ -639,6 +645,7 @@ public void testBSIAndBitmapIndexInDisk() throws Exception { createUnawareBucketFileStoreTable( rowType, options -> { + options.set(METADATA_STATS_MODE, "NONE"); options.set( FileIndexOptions.FILE_INDEX + "." 
@@ -665,7 +672,11 @@ public void testBSIAndBitmapIndexInDisk() throws Exception { write.write(GenericRow.of(1, BinaryString.fromString("B"), 3L)); write.write(GenericRow.of(1, BinaryString.fromString("C"), 3L)); result.addAll(write.prepareCommit(true, 0)); + write.write(GenericRow.of(1, BinaryString.fromString("A"), 4L)); + write.write(GenericRow.of(1, BinaryString.fromString("B"), 3L)); write.write(GenericRow.of(1, BinaryString.fromString("C"), 4L)); + write.write(GenericRow.of(1, BinaryString.fromString("D"), 2L)); + write.write(GenericRow.of(1, BinaryString.fromString("D"), 4L)); result.addAll(write.prepareCommit(true, 0)); commit.commit(0, result); result.clear(); diff --git a/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java b/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java index dca86aa61ec28..4917d076014a9 100644 --- a/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java @@ -99,6 +99,7 @@ import static org.apache.paimon.CoreOptions.ChangelogProducer.LOOKUP; import static org.apache.paimon.CoreOptions.DELETION_VECTORS_ENABLED; import static org.apache.paimon.CoreOptions.FILE_FORMAT; +import static org.apache.paimon.CoreOptions.FILE_INDEX_IN_MANIFEST_THRESHOLD; import static org.apache.paimon.CoreOptions.LOOKUP_LOCAL_FILE_TYPE; import static org.apache.paimon.CoreOptions.MERGE_ENGINE; import static org.apache.paimon.CoreOptions.MergeEngine; @@ -862,6 +863,92 @@ public void testDeletionVectorsWithFileIndexInMeta() throws Exception { assertThat(((DataSplit) splits.get(0)).dataFiles().size()).isEqualTo(1); } + @Test + public void testDeletionVectorsWithBitmapFileIndexInFile() throws Exception { + FileStoreTable table = + createFileStoreTable( + conf -> { + conf.set(BUCKET, 1); + conf.set(DELETION_VECTORS_ENABLED, true); + conf.set(TARGET_FILE_SIZE, MemorySize.ofBytes(1)); + conf.set(FILE_INDEX_IN_MANIFEST_THRESHOLD, MemorySize.ofBytes(1)); + conf.set("file-index.bitmap.columns", "b"); + }); + + StreamTableWrite write = + table.newWrite(commitUser).withIOManager(new IOManagerImpl(tempDir.toString())); + StreamTableCommit commit = table.newCommit(commitUser); + + write.write(rowData(1, 1, 300L)); + write.write(rowData(1, 2, 400L)); + write.write(rowData(1, 3, 100L)); + write.write(rowData(1, 4, 100L)); + commit.commit(0, write.prepareCommit(true, 0)); + + write.write(rowData(1, 1, 100L)); + write.write(rowData(1, 2, 100L)); + write.write(rowData(1, 3, 300L)); + write.write(rowData(1, 5, 100L)); + commit.commit(1, write.prepareCommit(true, 1)); + + write.write(rowData(1, 4, 200L)); + commit.commit(2, write.prepareCommit(true, 2)); + + PredicateBuilder builder = new PredicateBuilder(ROW_TYPE); + List splits = toSplits(table.newSnapshotReader().read().dataSplits()); + assertThat(((DataSplit) splits.get(0)).dataFiles().size()).isEqualTo(2); + TableRead read = table.newRead().withFilter(builder.equal(2, 100L)); + assertThat(getResult(read, splits, BATCH_ROW_TO_STRING)) + .hasSameElementsAs( + Arrays.asList( + "1|1|100|binary|varbinary|mapKey:mapVal|multiset", + "1|2|100|binary|varbinary|mapKey:mapVal|multiset", + "1|5|100|binary|varbinary|mapKey:mapVal|multiset")); + } + + @Test + public void testDeletionVectorsWithBitmapFileIndexInMeta() throws Exception { + FileStoreTable table = + createFileStoreTable( + conf -> { + conf.set(BUCKET, 1); + conf.set(DELETION_VECTORS_ENABLED, true); + 
conf.set(TARGET_FILE_SIZE, MemorySize.ofBytes(1)); + conf.set(FILE_INDEX_IN_MANIFEST_THRESHOLD, MemorySize.ofMebiBytes(1)); + conf.set("file-index.bitmap.columns", "b"); + }); + + StreamTableWrite write = + table.newWrite(commitUser).withIOManager(new IOManagerImpl(tempDir.toString())); + StreamTableCommit commit = table.newCommit(commitUser); + + write.write(rowData(1, 1, 300L)); + write.write(rowData(1, 2, 400L)); + write.write(rowData(1, 3, 100L)); + write.write(rowData(1, 4, 100L)); + commit.commit(0, write.prepareCommit(true, 0)); + + write.write(rowData(1, 1, 100L)); + write.write(rowData(1, 2, 100L)); + write.write(rowData(1, 3, 300L)); + write.write(rowData(1, 5, 100L)); + commit.commit(1, write.prepareCommit(true, 1)); + + write.write(rowData(1, 4, 200L)); + commit.commit(2, write.prepareCommit(true, 2)); + + PredicateBuilder builder = new PredicateBuilder(ROW_TYPE); + List splits = toSplits(table.newSnapshotReader().read().dataSplits()); + assertThat(((DataSplit) splits.get(0)).dataFiles().size()).isEqualTo(2); + TableRead read = table.newRead().withFilter(builder.equal(2, 100L)); + assertThat(getResult(read, splits, BATCH_ROW_TO_STRING)) + .hasSameElementsAs( + Arrays.asList( + "1|1|100|binary|varbinary|mapKey:mapVal|multiset", + "1|2|100|binary|varbinary|mapKey:mapVal|multiset", + "1|5|100|binary|varbinary|mapKey:mapVal|multiset")); + } + @Test public void testWithShardFirstRow() throws Exception { FileStoreTable table = From d16287eb16f45f0de0eba243cf9a5517d54d88a9 Mon Sep 17 00:00:00 2001 From: wangkang Date: Wed, 13 Nov 2024 15:42:20 +0800 Subject: [PATCH 009/157] [doc] Update hll_sketch and theta_sketch in aggregation.md (#4518) --- .../primary-key-table/merge-engine/aggregation.md | 10 +++++++--- 1 file changed, 7 insertions(+), 3 deletions(-) diff --git a/docs/content/primary-key-table/merge-engine/aggregation.md b/docs/content/primary-key-table/merge-engine/aggregation.md index fa667ed356871..0cc6507f2b4ce 100644 --- a/docs/content/primary-key-table/merge-engine/aggregation.md +++ b/docs/content/primary-key-table/merge-engine/aggregation.md @@ -247,16 +247,17 @@ An example: uv VARBINARY ) WITH ( 'merge-engine' = 'aggregation', - 'fields.f0.aggregate-function' = 'hll_sketch' + 'fields.uv.aggregate-function' = 'hll_sketch' ); -- Register the following class as a Flink function with the name "HLL_SKETCH" + -- for example: create TEMPORARY function HLL_SKETCH as 'HllSketchFunction'; -- which is used to transform input to sketch bytes array: -- -- public static class HllSketchFunction extends ScalarFunction { -- public byte[] eval(String user_id) { -- HllSketch hllSketch = new HllSketch(); - -- hllSketch.update(id); + -- hllSketch.update(user_id); -- return hllSketch.toCompactByteArray(); -- } -- } @@ -264,6 +265,7 @@ An example: INSERT INTO UV_AGG SELECT id, HLL_SKETCH(user_id) FROM VISITS; -- Register the following class as a Flink function with the name "HLL_SKETCH_COUNT" + -- for example: create TEMPORARY function HLL_SKETCH_COUNT as 'HllSketchCountFunction'; -- which is used to get cardinality from sketch bytes array: -- -- public static class HllSketchCountFunction extends ScalarFunction { @@ -307,10 +309,11 @@ An example: uv VARBINARY ) WITH ( 'merge-engine' = 'aggregation', - 'fields.f0.aggregate-function' = 'theta_sketch' + 'fields.uv.aggregate-function' = 'theta_sketch' ); -- Register the following class as a Flink function with the name "THETA_SKETCH" + -- for example: create TEMPORARY function THETA_SKETCH as 'ThetaSketchFunction'; -- which is used to transform 
input to sketch bytes array: -- -- public static class ThetaSketchFunction extends ScalarFunction { @@ -324,6 +327,7 @@ An example: INSERT INTO UV_AGG SELECT id, THETA_SKETCH(user_id) FROM VISITS; -- Register the following class as a Flink function with the name "THETA_SKETCH_COUNT" + -- for example: create TEMPORARY function THETA_SKETCH_COUNT as 'ThetaSketchCountFunction'; -- which is used to get cardinality from sketch bytes array: -- -- public static class ThetaSketchCountFunction extends ScalarFunction { From bbba0171423983714c106e4e62a050f757ecdc12 Mon Sep 17 00:00:00 2001 From: Jingsong Lee Date: Wed, 13 Nov 2024 15:43:16 +0800 Subject: [PATCH 010/157] [core] Make FormatReaderFactory return FileRecordReader to reduce cast (#4512) --- .../bitmap/ApplyBitmapIndexRecordReader.java | 20 +++----- .../paimon/format/FormatReaderFactory.java | 3 +- .../paimon/reader/EmptyFileRecordReader.java | 36 ++++++++++++++ .../paimon/reader/FileRecordIterator.java | 4 +- .../paimon/reader/FileRecordReader.java | 31 ++++++++++++ .../ApplyDeletionVectorReader.java | 20 +++----- ...dReader.java => DataFileRecordReader.java} | 47 ++++++++++--------- .../io/KeyValueDataFileRecordReader.java | 12 +++-- .../paimon/io/KeyValueFileReaderFactory.java | 7 +-- .../paimon/operation/RawFileSplitRead.java | 13 ++--- ...CompactedChangelogFormatReaderFactory.java | 4 +- .../paimon/format/avro/AvroBulkFormat.java | 8 ++-- .../paimon/format/orc/OrcReaderFactory.java | 8 ++-- .../format/parquet/ParquetReaderFactory.java | 9 ++-- 14 files changed, 140 insertions(+), 82 deletions(-) create mode 100644 paimon-common/src/main/java/org/apache/paimon/reader/EmptyFileRecordReader.java create mode 100644 paimon-common/src/main/java/org/apache/paimon/reader/FileRecordReader.java rename paimon-core/src/main/java/org/apache/paimon/io/{FileRecordReader.java => DataFileRecordReader.java} (88%) diff --git a/paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexRecordReader.java b/paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexRecordReader.java index d5d15095f2eda..3b1207c8bd6e5 100644 --- a/paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexRecordReader.java +++ b/paimon-common/src/main/java/org/apache/paimon/fileindex/bitmap/ApplyBitmapIndexRecordReader.java @@ -20,41 +20,35 @@ import org.apache.paimon.data.InternalRow; import org.apache.paimon.reader.FileRecordIterator; +import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.reader.RecordReader; import javax.annotation.Nullable; import java.io.IOException; -import static org.apache.paimon.utils.Preconditions.checkArgument; - /** A {@link RecordReader} which apply {@link BitmapIndexResult} to filter record. 
*/ -public class ApplyBitmapIndexRecordReader implements RecordReader { +public class ApplyBitmapIndexRecordReader implements FileRecordReader { - private final RecordReader reader; + private final FileRecordReader reader; private final BitmapIndexResult fileIndexResult; public ApplyBitmapIndexRecordReader( - RecordReader reader, BitmapIndexResult fileIndexResult) { + FileRecordReader reader, BitmapIndexResult fileIndexResult) { this.reader = reader; this.fileIndexResult = fileIndexResult; } @Nullable @Override - public RecordIterator readBatch() throws IOException { - RecordIterator batch = reader.readBatch(); + public FileRecordIterator readBatch() throws IOException { + FileRecordIterator batch = reader.readBatch(); if (batch == null) { return null; } - checkArgument( - batch instanceof FileRecordIterator, - "There is a bug, RecordIterator in ApplyBitmapIndexRecordReader must be FileRecordIterator"); - - return new ApplyBitmapIndexFileRecordIterator( - (FileRecordIterator) batch, fileIndexResult); + return new ApplyBitmapIndexFileRecordIterator(batch, fileIndexResult); } @Override diff --git a/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderFactory.java b/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderFactory.java index 420d44e0f61d9..d8af3e2fe37ca 100644 --- a/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderFactory.java +++ b/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderFactory.java @@ -22,6 +22,7 @@ import org.apache.paimon.fileindex.FileIndexResult; import org.apache.paimon.fs.FileIO; import org.apache.paimon.fs.Path; +import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.reader.RecordReader; import java.io.IOException; @@ -29,7 +30,7 @@ /** A factory to create {@link RecordReader} for file. */ public interface FormatReaderFactory { - RecordReader createReader(Context context) throws IOException; + FileRecordReader createReader(Context context) throws IOException; /** Context for creating reader. */ interface Context { diff --git a/paimon-common/src/main/java/org/apache/paimon/reader/EmptyFileRecordReader.java b/paimon-common/src/main/java/org/apache/paimon/reader/EmptyFileRecordReader.java new file mode 100644 index 0000000000000..3fa25dce5c490 --- /dev/null +++ b/paimon-common/src/main/java/org/apache/paimon/reader/EmptyFileRecordReader.java @@ -0,0 +1,36 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.reader; + +import javax.annotation.Nullable; + +import java.io.IOException; + +/** An empty {@link FileRecordReader}. 
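The theme of this refactor is Java's covariant return types: once createReader and readBatch are declared with the narrower FileRecordReader and FileRecordIterator types, the instanceof checks and casts at call sites become unnecessary. A toy, self-contained illustration (the interface and class names below are invented for the sketch, not Paimon APIs):

    interface Batch {}

    interface PositionedBatch extends Batch {
        long returnedPosition();
    }

    interface Reader {
        Batch readBatch();
    }

    // Overriding with a narrower return type is legal and removes casts at call sites.
    interface PositionedReader extends Reader {
        @Override
        PositionedBatch readBatch();
    }

    class CovariantReturnSketch {
        static long firstPosition(PositionedReader reader) {
            return reader.readBatch().returnedPosition(); // no instanceof, no cast
        }

        public static void main(String[] args) {
            PositionedReader reader = () -> () -> 42L; // both interfaces have a single method
            System.out.println(firstPosition(reader)); // 42
        }
    }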
*/ +public class EmptyFileRecordReader implements FileRecordReader { + + @Nullable + @Override + public FileRecordIterator readBatch() throws IOException { + return null; + } + + @Override + public void close() throws IOException {} +} diff --git a/paimon-common/src/main/java/org/apache/paimon/reader/FileRecordIterator.java b/paimon-common/src/main/java/org/apache/paimon/reader/FileRecordIterator.java index d22b27053f986..2d3c85f193dcf 100644 --- a/paimon-common/src/main/java/org/apache/paimon/reader/FileRecordIterator.java +++ b/paimon-common/src/main/java/org/apache/paimon/reader/FileRecordIterator.java @@ -27,10 +27,8 @@ import java.util.function.Function; /** - * Wrap {@link RecordReader.RecordIterator} to support returning the record's row position and file + * A {@link RecordReader.RecordIterator} to support returning the record's row position and file * Path. - * - * @param The type of the record. */ public interface FileRecordIterator extends RecordReader.RecordIterator { diff --git a/paimon-common/src/main/java/org/apache/paimon/reader/FileRecordReader.java b/paimon-common/src/main/java/org/apache/paimon/reader/FileRecordReader.java new file mode 100644 index 0000000000000..4d5356edf2757 --- /dev/null +++ b/paimon-common/src/main/java/org/apache/paimon/reader/FileRecordReader.java @@ -0,0 +1,31 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.reader; + +import javax.annotation.Nullable; + +import java.io.IOException; + +/** A {@link RecordReader} to support returning {@link FileRecordIterator}. */ +public interface FileRecordReader extends RecordReader { + + @Override + @Nullable + FileRecordIterator readBatch() throws IOException; +} diff --git a/paimon-core/src/main/java/org/apache/paimon/deletionvectors/ApplyDeletionVectorReader.java b/paimon-core/src/main/java/org/apache/paimon/deletionvectors/ApplyDeletionVectorReader.java index c1dc16a78d950..2fc292e54d340 100644 --- a/paimon-core/src/main/java/org/apache/paimon/deletionvectors/ApplyDeletionVectorReader.java +++ b/paimon-core/src/main/java/org/apache/paimon/deletionvectors/ApplyDeletionVectorReader.java @@ -20,23 +20,22 @@ import org.apache.paimon.data.InternalRow; import org.apache.paimon.reader.FileRecordIterator; +import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.reader.RecordReader; import javax.annotation.Nullable; import java.io.IOException; -import static org.apache.paimon.utils.Preconditions.checkArgument; - /** A {@link RecordReader} which apply {@link DeletionVector} to filter record. 
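For contrast with the bitmap case above, a deletion vector marks positions to drop rather than positions to keep, so the filtering check is inverted. A minimal sketch of that behavior, using java.util.BitSet as a stand-in for the real DeletionVector interface (which is more involved):

    import java.util.BitSet;

    public class DeletionVectorFilterSketch {
        public static void main(String[] args) {
            BitSet deleted = new BitSet(); // stand-in for a DeletionVector
            deleted.set(2);
            deleted.set(5);

            String[] rows = {"r0", "r1", "r2", "r3", "r4", "r5"};
            for (int position = 0; position < rows.length; position++) {
                if (deleted.get(position)) {
                    continue; // row was deleted, skip it
                }
                System.out.println(rows[position]); // prints r0, r1, r3, r4
            }
        }
    }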
*/ -public class ApplyDeletionVectorReader implements RecordReader { +public class ApplyDeletionVectorReader implements FileRecordReader { - private final RecordReader reader; + private final FileRecordReader reader; private final DeletionVector deletionVector; public ApplyDeletionVectorReader( - RecordReader reader, DeletionVector deletionVector) { + FileRecordReader reader, DeletionVector deletionVector) { this.reader = reader; this.deletionVector = deletionVector; } @@ -51,19 +50,14 @@ public DeletionVector deletionVector() { @Nullable @Override - public RecordIterator readBatch() throws IOException { - RecordIterator batch = reader.readBatch(); + public FileRecordIterator readBatch() throws IOException { + FileRecordIterator batch = reader.readBatch(); if (batch == null) { return null; } - checkArgument( - batch instanceof FileRecordIterator, - "There is a bug, RecordIterator in ApplyDeletionVectorReader must be FileRecordIterator"); - - return new ApplyDeletionFileRecordIterator( - (FileRecordIterator) batch, deletionVector); + return new ApplyDeletionFileRecordIterator(batch, deletionVector); } @Override diff --git a/paimon-core/src/main/java/org/apache/paimon/io/FileRecordReader.java b/paimon-core/src/main/java/org/apache/paimon/io/DataFileRecordReader.java similarity index 88% rename from paimon-core/src/main/java/org/apache/paimon/io/FileRecordReader.java rename to paimon-core/src/main/java/org/apache/paimon/io/DataFileRecordReader.java index 1e12025ba5330..d2559fe6240b2 100644 --- a/paimon-core/src/main/java/org/apache/paimon/io/FileRecordReader.java +++ b/paimon-core/src/main/java/org/apache/paimon/io/DataFileRecordReader.java @@ -25,7 +25,8 @@ import org.apache.paimon.data.PartitionInfo; import org.apache.paimon.data.columnar.ColumnarRowIterator; import org.apache.paimon.format.FormatReaderFactory; -import org.apache.paimon.reader.RecordReader; +import org.apache.paimon.reader.FileRecordIterator; +import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.utils.FileUtils; import org.apache.paimon.utils.ProjectedRow; @@ -34,17 +35,35 @@ import java.io.IOException; /** Reads {@link InternalRow} from data files. 
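The indexMapping, castMapping and partitionInfo arguments of the reader below adapt what the format produced to the table schema: roughly, output field i is read from position indexMapping[i] of the underlying row, optionally cast, and partition columns are filled in as constants. A toy version of just the index-mapping step (plain object arrays instead of InternalRow, ignoring casts and partitions):

    import java.util.Arrays;

    public class IndexMappingSketch {
        public static void main(String[] args) {
            Object[] fileRow = {"a-value", 7, 3.14};
            int[] indexMapping = {2, 0}; // produce (fileRow[2], fileRow[0])

            Object[] projected = new Object[indexMapping.length];
            for (int i = 0; i < indexMapping.length; i++) {
                projected[i] = fileRow[indexMapping[i]];
            }
            System.out.println(Arrays.toString(projected)); // [3.14, a-value]
        }
    }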
*/ -public class FileRecordReader implements RecordReader { +public class DataFileRecordReader implements FileRecordReader { - private final RecordReader reader; + private final FileRecordReader reader; @Nullable private final int[] indexMapping; @Nullable private final PartitionInfo partitionInfo; @Nullable private final CastFieldGetter[] castMapping; + public DataFileRecordReader( + FormatReaderFactory readerFactory, + FormatReaderFactory.Context context, + @Nullable int[] indexMapping, + @Nullable CastFieldGetter[] castMapping, + @Nullable PartitionInfo partitionInfo) + throws IOException { + try { + this.reader = readerFactory.createReader(context); + } catch (Exception e) { + FileUtils.checkExists(context.fileIO(), context.filePath()); + throw e; + } + this.indexMapping = indexMapping; + this.partitionInfo = partitionInfo; + this.castMapping = castMapping; + } + @Nullable @Override - public RecordReader.RecordIterator readBatch() throws IOException { - RecordIterator iterator = reader.readBatch(); + public FileRecordIterator readBatch() throws IOException { + FileRecordIterator iterator = reader.readBatch(); if (iterator == null) { return null; } @@ -71,24 +90,6 @@ public RecordReader.RecordIterator readBatch() throws IOException { return iterator; } - public FileRecordReader( - FormatReaderFactory readerFactory, - FormatReaderFactory.Context context, - @Nullable int[] indexMapping, - @Nullable CastFieldGetter[] castMapping, - @Nullable PartitionInfo partitionInfo) - throws IOException { - try { - this.reader = readerFactory.createReader(context); - } catch (Exception e) { - FileUtils.checkExists(context.fileIO(), context.filePath()); - throw e; - } - this.indexMapping = indexMapping; - this.partitionInfo = partitionInfo; - this.castMapping = castMapping; - } - @Override public void close() throws IOException { reader.close(); diff --git a/paimon-core/src/main/java/org/apache/paimon/io/KeyValueDataFileRecordReader.java b/paimon-core/src/main/java/org/apache/paimon/io/KeyValueDataFileRecordReader.java index e44ad79ff53ee..6cf08769703fc 100644 --- a/paimon-core/src/main/java/org/apache/paimon/io/KeyValueDataFileRecordReader.java +++ b/paimon-core/src/main/java/org/apache/paimon/io/KeyValueDataFileRecordReader.java @@ -21,6 +21,8 @@ import org.apache.paimon.KeyValue; import org.apache.paimon.KeyValueSerializer; import org.apache.paimon.data.InternalRow; +import org.apache.paimon.reader.FileRecordIterator; +import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.reader.RecordReader; import org.apache.paimon.types.RowType; @@ -29,14 +31,14 @@ import java.io.IOException; /** {@link RecordReader} for reading {@link KeyValue} data files. 
*/ -public class KeyValueDataFileRecordReader implements RecordReader { +public class KeyValueDataFileRecordReader implements FileRecordReader { - private final RecordReader reader; + private final FileRecordReader reader; private final KeyValueSerializer serializer; private final int level; public KeyValueDataFileRecordReader( - RecordReader reader, RowType keyType, RowType valueType, int level) { + FileRecordReader reader, RowType keyType, RowType valueType, int level) { this.reader = reader; this.serializer = new KeyValueSerializer(keyType, valueType); this.level = level; @@ -44,8 +46,8 @@ public KeyValueDataFileRecordReader( @Nullable @Override - public RecordIterator readBatch() throws IOException { - RecordReader.RecordIterator iterator = reader.readBatch(); + public FileRecordIterator readBatch() throws IOException { + FileRecordIterator iterator = reader.readBatch(); if (iterator == null) { return null; } diff --git a/paimon-core/src/main/java/org/apache/paimon/io/KeyValueFileReaderFactory.java b/paimon-core/src/main/java/org/apache/paimon/io/KeyValueFileReaderFactory.java index fdbb727e56747..7d3acd729c55a 100644 --- a/paimon-core/src/main/java/org/apache/paimon/io/KeyValueFileReaderFactory.java +++ b/paimon-core/src/main/java/org/apache/paimon/io/KeyValueFileReaderFactory.java @@ -32,6 +32,7 @@ import org.apache.paimon.fs.Path; import org.apache.paimon.partition.PartitionUtils; import org.apache.paimon.predicate.Predicate; +import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.reader.RecordReader; import org.apache.paimon.schema.KeyValueFieldsExtractor; import org.apache.paimon.schema.SchemaManager; @@ -109,7 +110,7 @@ public RecordReader createRecordReader( return createRecordReader(schemaId, fileName, level, true, null, fileSize); } - private RecordReader createRecordReader( + private FileRecordReader createRecordReader( long schemaId, String fileName, int level, @@ -134,8 +135,8 @@ private RecordReader createRecordReader( : formatSupplier.get(); Path filePath = pathFactory.toPath(fileName); - RecordReader fileRecordReader = - new FileRecordReader( + FileRecordReader fileRecordReader = + new DataFileRecordReader( bulkFormatMapping.getReaderFactory(), orcPoolSize == null ? 
new FormatReaderContext(fileIO, filePath, fileSize) diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/RawFileSplitRead.java b/paimon-core/src/main/java/org/apache/paimon/operation/RawFileSplitRead.java index 4a6fa5b3db7f2..46977457c4be5 100644 --- a/paimon-core/src/main/java/org/apache/paimon/operation/RawFileSplitRead.java +++ b/paimon-core/src/main/java/org/apache/paimon/operation/RawFileSplitRead.java @@ -32,12 +32,13 @@ import org.apache.paimon.fs.FileIO; import org.apache.paimon.io.DataFileMeta; import org.apache.paimon.io.DataFilePathFactory; +import org.apache.paimon.io.DataFileRecordReader; import org.apache.paimon.io.FileIndexEvaluator; -import org.apache.paimon.io.FileRecordReader; import org.apache.paimon.mergetree.compact.ConcatRecordReader; import org.apache.paimon.partition.PartitionUtils; import org.apache.paimon.predicate.Predicate; -import org.apache.paimon.reader.EmptyRecordReader; +import org.apache.paimon.reader.EmptyFileRecordReader; +import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.reader.ReaderSupplier; import org.apache.paimon.reader.RecordReader; import org.apache.paimon.schema.SchemaManager; @@ -187,7 +188,7 @@ public RecordReader createReader( return ConcatRecordReader.create(suppliers); } - private RecordReader createFileReader( + private FileRecordReader createFileReader( BinaryRow partition, DataFileMeta file, DataFilePathFactory dataFilePathFactory, @@ -204,7 +205,7 @@ private RecordReader createFileReader( dataFilePathFactory, file); if (!fileIndexResult.remain()) { - return new EmptyRecordReader<>(); + return new EmptyFileRecordReader<>(); } } @@ -214,8 +215,8 @@ private RecordReader createFileReader( dataFilePathFactory.toPath(file.fileName()), file.fileSize(), fileIndexResult); - RecordReader fileRecordReader = - new FileRecordReader( + FileRecordReader fileRecordReader = + new DataFileRecordReader( bulkFormatMapping.getReaderFactory(), formatReaderContext, bulkFormatMapping.getIndexMapping(), diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/compact/changelog/format/CompactedChangelogFormatReaderFactory.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/compact/changelog/format/CompactedChangelogFormatReaderFactory.java index e17566f302cdc..e0aed448db93c 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/compact/changelog/format/CompactedChangelogFormatReaderFactory.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/compact/changelog/format/CompactedChangelogFormatReaderFactory.java @@ -27,7 +27,7 @@ import org.apache.paimon.fs.Path; import org.apache.paimon.fs.PositionOutputStream; import org.apache.paimon.fs.SeekableInputStream; -import org.apache.paimon.reader.RecordReader; +import org.apache.paimon.reader.FileRecordReader; import java.io.EOFException; import java.io.IOException; @@ -60,7 +60,7 @@ public CompactedChangelogFormatReaderFactory(FormatReaderFactory wrapped) { } @Override - public RecordReader createReader(Context context) throws IOException { + public FileRecordReader createReader(Context context) throws IOException { OffsetReadOnlyFileIO fileIO = new OffsetReadOnlyFileIO(context.fileIO()); long length = decodePath(context.filePath()).length; diff --git a/paimon-format/src/main/java/org/apache/paimon/format/avro/AvroBulkFormat.java b/paimon-format/src/main/java/org/apache/paimon/format/avro/AvroBulkFormat.java index 7f3e275183cf3..a06ca9948c444 100644 --- 
a/paimon-format/src/main/java/org/apache/paimon/format/avro/AvroBulkFormat.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/avro/AvroBulkFormat.java @@ -22,7 +22,7 @@ import org.apache.paimon.format.FormatReaderFactory; import org.apache.paimon.fs.FileIO; import org.apache.paimon.fs.Path; -import org.apache.paimon.reader.RecordReader; +import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.types.RowType; import org.apache.paimon.utils.IOUtils; import org.apache.paimon.utils.IteratorResultIterator; @@ -49,12 +49,12 @@ public AvroBulkFormat(RowType projectedRowType) { } @Override - public RecordReader createReader(FormatReaderFactory.Context context) + public FileRecordReader createReader(FormatReaderFactory.Context context) throws IOException { return new AvroReader(context.fileIO(), context.filePath(), context.fileSize()); } - private class AvroReader implements RecordReader { + private class AvroReader implements FileRecordReader { private final FileIO fileIO; private final DataFileReader reader; @@ -90,7 +90,7 @@ private DataFileReader createReaderFromPath(Path path, long fileSiz @Nullable @Override - public RecordIterator readBatch() throws IOException { + public IteratorResultIterator readBatch() throws IOException { Object ticket; try { ticket = pool.pollEntry(); diff --git a/paimon-format/src/main/java/org/apache/paimon/format/orc/OrcReaderFactory.java b/paimon-format/src/main/java/org/apache/paimon/format/orc/OrcReaderFactory.java index dbc5de265c492..05f3dd7851e84 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/orc/OrcReaderFactory.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/orc/OrcReaderFactory.java @@ -30,6 +30,7 @@ import org.apache.paimon.format.orc.filter.OrcFilters; import org.apache.paimon.fs.FileIO; import org.apache.paimon.fs.Path; +import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.reader.RecordReader.RecordIterator; import org.apache.paimon.types.DataType; import org.apache.paimon.types.RowType; @@ -184,7 +185,7 @@ public VectorizedRowBatch orcVectorizedRowBatch() { return orcVectorizedRowBatch; } - private RecordIterator convertAndGetIterator( + private ColumnarRowIterator convertAndGetIterator( VectorizedRowBatch orcBatch, long rowNumber) { // no copying from the ORC column vectors to the Paimon columns vectors necessary, // because they point to the same data arrays internally design @@ -209,8 +210,7 @@ private RecordIterator convertAndGetIterator( * batch is addressed by the starting row number of the batch, plus the number of records to be * skipped before. 
*/ - private static final class OrcVectorizedReader - implements org.apache.paimon.reader.RecordReader { + private static final class OrcVectorizedReader implements FileRecordReader { private final RecordReader orcReader; private final Pool pool; @@ -222,7 +222,7 @@ private OrcVectorizedReader(final RecordReader orcReader, final Pool readBatch() throws IOException { + public ColumnarRowIterator readBatch() throws IOException { final OrcReaderBatch batch = getCachedEntry(); final VectorizedRowBatch orcVectorBatch = batch.orcVectorizedRowBatch(); diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java index 2a62c0bc89471..2e792d153c1b1 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java @@ -31,8 +31,7 @@ import org.apache.paimon.format.parquet.type.ParquetField; import org.apache.paimon.fs.Path; import org.apache.paimon.options.Options; -import org.apache.paimon.reader.RecordReader; -import org.apache.paimon.reader.RecordReader.RecordIterator; +import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.types.ArrayType; import org.apache.paimon.types.DataField; import org.apache.paimon.types.DataType; @@ -307,7 +306,7 @@ private VectorizedColumnBatch createVectorizedColumnBatch( return new VectorizedColumnBatch(vectors); } - private class ParquetReader implements RecordReader { + private class ParquetReader implements FileRecordReader { private ParquetFileReader reader; @@ -360,7 +359,7 @@ private ParquetReader( @Nullable @Override - public RecordIterator readBatch() throws IOException { + public ColumnarRowIterator readBatch() throws IOException { final ParquetReaderBatch batch = getCachedEntry(); if (!nextBatch(batch)) { @@ -488,7 +487,7 @@ public void recycle() { recycler.recycle(this); } - public RecordIterator convertAndGetIterator(long rowNumber) { + public ColumnarRowIterator convertAndGetIterator(long rowNumber) { result.reset(rowNumber); return result; } From e0ae6c8f5634056bdee8dbc7309d269ac175d381 Mon Sep 17 00:00:00 2001 From: tsreaper Date: Wed, 13 Nov 2024 15:49:52 +0800 Subject: [PATCH 011/157] [parquet] Fix nested array/map has no id in parquet files (#4513) --- .../apache/paimon/table/SpecialFields.java | 34 +++- .../format/parquet/ParquetReaderFactory.java | 33 ++-- .../parquet/ParquetSchemaConverter.java | 165 ++++++++---------- .../format/parquet/ParquetReadWriteTest.java | 29 ++- 4 files changed, 142 insertions(+), 119 deletions(-) diff --git a/paimon-common/src/main/java/org/apache/paimon/table/SpecialFields.java b/paimon-common/src/main/java/org/apache/paimon/table/SpecialFields.java index 36f22a3107556..d438bfb0ffe9e 100644 --- a/paimon-common/src/main/java/org/apache/paimon/table/SpecialFields.java +++ b/paimon-common/src/main/java/org/apache/paimon/table/SpecialFields.java @@ -48,9 +48,18 @@ * directly by id. These ids are not stored in {@link org.apache.paimon.types.DataField}. * *
- *   • Array element field: ID = 536870911 + (array-field-id).
- *   • Map key field: ID = 536870911 + (array-field-id).
- *   • Map value field: ID = 536870911 - (array-field-id).
+ *   • Array element field: ID = 536870911 + 1024 * (array-field-id) + depth.
+ *   • Map key field: ID = 536870911 - 1024 * (array-field-id) - depth.
+ *   • Map value field: ID = 536870911 + 1024 * (array-field-id) + depth.
+ *
+ * Examples:
+ *
+ *   • ARRAY(MAP(INT, ARRAY(INT))) type, outer array has field id 10, then map (element of outer
+ *     array) has field id 536870911 + 1024 * 10 + 1, map key (int) has field id 536870911 - 1024
+ *     * 10 - 2, map value (inner array) has field id 536870911 + 1024 * 10 + 2, inner array
+ *     element (int) has field id 536870911 + 1024 * 10 + 3
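Spelling the example above out numerically, with BASE = Integer.MAX_VALUE / 4 = 536870911 and a depth step of 1024 (a scratch calculation to check the documented ids, not code from the patch):

    public class NestedFieldIdCheck {
        static final int BASE = Integer.MAX_VALUE / 4; // 536870911
        static final int DEPTH_LIMIT = 1 << 10;        // 1024

        public static void main(String[] args) {
            int outerArrayId = 10;
            // map (element of the outer array), depth 1
            System.out.println(BASE + DEPTH_LIMIT * outerArrayId + 1); // 536881152
            // map key (int), depth 2
            System.out.println(BASE - DEPTH_LIMIT * outerArrayId - 2); // 536860669
            // map value (the inner array), depth 2
            System.out.println(BASE + DEPTH_LIMIT * outerArrayId + 2); // 536881153
            // element of the inner array (int), depth 3
            System.out.println(BASE + DEPTH_LIMIT * outerArrayId + 3); // 536881154
        }
    }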
*/ public class SpecialFields { @@ -95,16 +104,23 @@ public static boolean isSystemField(String field) { // ---------------------------------------------------------------------------------------- public static final int STRUCTURED_TYPE_FIELD_ID_BASE = Integer.MAX_VALUE / 4; + public static final int STRUCTURED_TYPE_FIELD_DEPTH_LIMIT = 1 << 10; - public static int getArrayElementFieldId(int arrayFieldId) { - return STRUCTURED_TYPE_FIELD_ID_BASE + arrayFieldId; + public static int getArrayElementFieldId(int arrayFieldId, int depth) { + return STRUCTURED_TYPE_FIELD_ID_BASE + + arrayFieldId * STRUCTURED_TYPE_FIELD_DEPTH_LIMIT + + depth; } - public static int getMapKeyFieldId(int mapFieldId) { - return STRUCTURED_TYPE_FIELD_ID_BASE + mapFieldId; + public static int getMapKeyFieldId(int mapFieldId, int depth) { + return STRUCTURED_TYPE_FIELD_ID_BASE + - mapFieldId * STRUCTURED_TYPE_FIELD_DEPTH_LIMIT + - depth; } - public static int getMapValueFieldId(int mapFieldId) { - return STRUCTURED_TYPE_FIELD_ID_BASE - mapFieldId; + public static int getMapValueFieldId(int mapFieldId, int depth) { + return STRUCTURED_TYPE_FIELD_ID_BASE + + mapFieldId * STRUCTURED_TYPE_FIELD_DEPTH_LIMIT + + depth; } } diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java index 2e792d153c1b1..cede205f4d513 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java @@ -87,8 +87,8 @@ public class ParquetReaderFactory implements FormatReaderFactory { private final Options conf; private final RowType projectedType; - private final String[] projectedFields; - private final DataType[] projectedTypes; + private final String[] projectedColumnNames; + private final DataField[] projectedFields; private final int batchSize; private final FilterCompat.Filter filter; private final Set unknownFieldsIndices = new HashSet<>(); @@ -97,14 +97,15 @@ public ParquetReaderFactory( Options conf, RowType projectedType, int batchSize, FilterCompat.Filter filter) { this.conf = conf; this.projectedType = projectedType; - this.projectedFields = projectedType.getFieldNames().toArray(new String[0]); - this.projectedTypes = projectedType.getFieldTypes().toArray(new DataType[0]); + this.projectedColumnNames = projectedType.getFieldNames().toArray(new String[0]); + this.projectedFields = projectedType.getFields().toArray(new DataField[0]); this.batchSize = batchSize; this.filter = filter; } @Override - public ParquetReader createReader(FormatReaderFactory.Context context) throws IOException { + public RecordReader createReader(FormatReaderFactory.Context context) + throws IOException { ParquetReadOptions.Builder builder = ParquetReadOptions.builder().withRange(0, context.fileSize()); setReadOptions(builder); @@ -153,20 +154,20 @@ private void setReadOptions(ParquetReadOptions.Builder builder) { /** Clips `parquetSchema` according to `fieldNames`. 
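The clipping step is projection pushdown with a fallback for columns the file does not contain, which happens after schema evolution such as adding a column: known columns are narrowed to the requested type, unknown ones are remembered so they can later be filled with nulls. A simplified, self-contained sketch of that bookkeeping (plain strings instead of Parquet types):

    import java.util.Arrays;
    import java.util.HashSet;
    import java.util.List;
    import java.util.Set;

    public class ClipSchemaSketch {
        public static void main(String[] args) {
            List<String> fileColumns = Arrays.asList("a", "b", "c");
            String[] projected = {"c", "d"}; // "d" was added to the table after this file was written

            Set<Integer> unknownFieldIndices = new HashSet<>();
            for (int i = 0; i < projected.length; i++) {
                if (!fileColumns.contains(projected[i])) {
                    unknownFieldIndices.add(i); // these fields will be read as null
                }
            }
            System.out.println(unknownFieldIndices); // [1]
        }
    }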
*/ private MessageType clipParquetSchema(GroupType parquetSchema) { - Type[] types = new Type[projectedFields.length]; - for (int i = 0; i < projectedFields.length; ++i) { - String fieldName = projectedFields[i]; + Type[] types = new Type[projectedColumnNames.length]; + for (int i = 0; i < projectedColumnNames.length; ++i) { + String fieldName = projectedColumnNames[i]; if (!parquetSchema.containsField(fieldName)) { LOG.warn( "{} does not exist in {}, will fill the field with null.", fieldName, parquetSchema); types[i] = - ParquetSchemaConverter.convertToParquetType(fieldName, projectedTypes[i]); + ParquetSchemaConverter.convertToParquetType(fieldName, projectedFields[i]); unknownFieldsIndices.add(i); } else { Type parquetType = parquetSchema.getType(fieldName); - types[i] = clipParquetType(projectedTypes[i], parquetType); + types[i] = clipParquetType(projectedFields[i].type(), parquetType); } } @@ -220,7 +221,7 @@ private Type clipParquetType(DataType readType, Type parquetType) { private void checkSchema(MessageType fileSchema, MessageType requestedSchema) throws IOException, UnsupportedOperationException { - if (projectedFields.length != requestedSchema.getFieldCount()) { + if (projectedColumnNames.length != requestedSchema.getFieldCount()) { throw new RuntimeException( "The quality of field type is incompatible with the request schema!"); } @@ -268,13 +269,13 @@ private ParquetReaderBatch createReaderBatch( } private WritableColumnVector[] createWritableVectors(MessageType requestedSchema) { - WritableColumnVector[] columns = new WritableColumnVector[projectedTypes.length]; + WritableColumnVector[] columns = new WritableColumnVector[projectedFields.length]; List types = requestedSchema.getFields(); - for (int i = 0; i < projectedTypes.length; i++) { + for (int i = 0; i < projectedFields.length; i++) { columns[i] = createWritableColumnVector( batchSize, - projectedTypes[i], + projectedFields[i].type(), types.get(i), requestedSchema.getColumns(), 0); @@ -290,7 +291,7 @@ private VectorizedColumnBatch createVectorizedColumnBatch( WritableColumnVector[] writableVectors) { ColumnVector[] vectors = new ColumnVector[writableVectors.length]; for (int i = 0; i < writableVectors.length; i++) { - switch (projectedTypes[i].getTypeRoot()) { + switch (projectedFields[i].type().getTypeRoot()) { case DECIMAL: vectors[i] = new ParquetDecimalVector(writableVectors[i]); break; @@ -416,7 +417,7 @@ private void readNextRowGroup() throws IOException { if (!unknownFieldsIndices.contains(i)) { columnReaders[i] = createColumnReader( - projectedTypes[i], + projectedFields[i].type(), types.get(i), requestedSchema.getColumns(), rowGroup, diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetSchemaConverter.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetSchemaConverter.java index 5cf81c375a37d..708e5eb7ea3d4 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetSchemaConverter.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetSchemaConverter.java @@ -22,7 +22,6 @@ import org.apache.paimon.types.ArrayType; import org.apache.paimon.types.DataField; import org.apache.paimon.types.DataType; -import org.apache.paimon.types.DataTypeRoot; import org.apache.paimon.types.DecimalType; import org.apache.paimon.types.IntType; import org.apache.paimon.types.LocalZonedTimestampType; @@ -39,9 +38,6 @@ import org.apache.parquet.schema.Type; import org.apache.parquet.schema.Types; -import java.util.ArrayList; -import 
java.util.List; - import static org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName.FIXED_LEN_BYTE_ARRAY; import static org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName.INT32; import static org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName.INT64; @@ -59,86 +55,110 @@ public static MessageType convertToParquetMessageType(String name, RowType rowTy return new MessageType(name, convertToParquetTypes(rowType)); } - public static Type convertToParquetType(String name, DataType type) { - Type.Repetition repetition = - type.isNullable() ? Type.Repetition.OPTIONAL : Type.Repetition.REQUIRED; - return convertToParquetType(name, type, repetition); + public static Type convertToParquetType(String name, DataField field) { + return convertToParquetType(name, field.type(), field.id(), 0); + } + + private static Type[] convertToParquetTypes(RowType rowType) { + return rowType.getFields().stream() + .map(f -> convertToParquetType(f.name(), f.type(), f.id(), 0)) + .toArray(Type[]::new); } - private static Type convertToParquetType( - String name, DataType type, Type.Repetition repetition) { + private static Type convertToParquetType(String name, DataType type, int fieldId, int depth) { + Type.Repetition repetition = + type.isNullable() ? Type.Repetition.OPTIONAL : Type.Repetition.REQUIRED; switch (type.getTypeRoot()) { case CHAR: case VARCHAR: return Types.primitive(PrimitiveType.PrimitiveTypeName.BINARY, repetition) .as(LogicalTypeAnnotation.stringType()) - .named(name); + .named(name) + .withId(fieldId); case BOOLEAN: return Types.primitive(PrimitiveType.PrimitiveTypeName.BOOLEAN, repetition) - .named(name); + .named(name) + .withId(fieldId); case BINARY: case VARBINARY: return Types.primitive(PrimitiveType.PrimitiveTypeName.BINARY, repetition) - .named(name); + .named(name) + .withId(fieldId); case DECIMAL: int precision = ((DecimalType) type).getPrecision(); int scale = ((DecimalType) type).getScale(); if (is32BitDecimal(precision)) { return Types.primitive(INT32, repetition) .as(LogicalTypeAnnotation.decimalType(scale, precision)) - .named(name); + .named(name) + .withId(fieldId); } else if (is64BitDecimal(precision)) { return Types.primitive(INT64, repetition) .as(LogicalTypeAnnotation.decimalType(scale, precision)) - .named(name); + .named(name) + .withId(fieldId); } else { return Types.primitive(FIXED_LEN_BYTE_ARRAY, repetition) .as(LogicalTypeAnnotation.decimalType(scale, precision)) .length(computeMinBytesForDecimalPrecision(precision)) - .named(name); + .named(name) + .withId(fieldId); } case TINYINT: return Types.primitive(INT32, repetition) .as(LogicalTypeAnnotation.intType(8, true)) - .named(name); + .named(name) + .withId(fieldId); case SMALLINT: return Types.primitive(INT32, repetition) .as(LogicalTypeAnnotation.intType(16, true)) - .named(name); + .named(name) + .withId(fieldId); case INTEGER: - return Types.primitive(INT32, repetition).named(name); + return Types.primitive(INT32, repetition).named(name).withId(fieldId); case BIGINT: - return Types.primitive(INT64, repetition).named(name); + return Types.primitive(INT64, repetition).named(name).withId(fieldId); case FLOAT: return Types.primitive(PrimitiveType.PrimitiveTypeName.FLOAT, repetition) - .named(name); + .named(name) + .withId(fieldId); case DOUBLE: return Types.primitive(PrimitiveType.PrimitiveTypeName.DOUBLE, repetition) - .named(name); + .named(name) + .withId(fieldId); case DATE: return Types.primitive(INT32, repetition) .as(LogicalTypeAnnotation.dateType()) - .named(name); + .named(name) + 
.withId(fieldId); case TIME_WITHOUT_TIME_ZONE: return Types.primitive(INT32, repetition) .as( LogicalTypeAnnotation.timeType( true, LogicalTypeAnnotation.TimeUnit.MILLIS)) - .named(name); + .named(name) + .withId(fieldId); case TIMESTAMP_WITHOUT_TIME_ZONE: TimestampType timestampType = (TimestampType) type; return createTimestampWithLogicalType( - name, timestampType.getPrecision(), repetition, false); + name, timestampType.getPrecision(), repetition, false) + .withId(fieldId); case TIMESTAMP_WITH_LOCAL_TIME_ZONE: LocalZonedTimestampType localZonedTimestampType = (LocalZonedTimestampType) type; return createTimestampWithLogicalType( - name, localZonedTimestampType.getPrecision(), repetition, true); + name, localZonedTimestampType.getPrecision(), repetition, true) + .withId(fieldId); case ARRAY: ArrayType arrayType = (ArrayType) type; - return ConversionPatterns.listOfElements( - repetition, - name, - convertToParquetType(LIST_ELEMENT_NAME, arrayType.getElementType())); + Type elementParquetType = + convertToParquetType( + LIST_ELEMENT_NAME, + arrayType.getElementType(), + fieldId, + depth + 1) + .withId(SpecialFields.getArrayElementFieldId(fieldId, depth + 1)); + return ConversionPatterns.listOfElements(repetition, name, elementParquetType) + .withId(fieldId); case MAP: MapType mapType = (MapType) type; DataType keyType = mapType.getKeyType(); @@ -147,12 +167,20 @@ private static Type convertToParquetType( // it as not nullable keyType = keyType.copy(false); } + Type mapKeyParquetType = + convertToParquetType(MAP_KEY_NAME, keyType, fieldId, depth + 1) + .withId(SpecialFields.getMapKeyFieldId(fieldId, depth + 1)); + Type mapValueParquetType = + convertToParquetType( + MAP_VALUE_NAME, mapType.getValueType(), fieldId, depth + 1) + .withId(SpecialFields.getMapValueFieldId(fieldId, depth + 1)); return ConversionPatterns.mapType( - repetition, - name, - MAP_REPEATED_NAME, - convertToParquetType(MAP_KEY_NAME, keyType), - convertToParquetType(MAP_VALUE_NAME, mapType.getValueType())); + repetition, + name, + MAP_REPEATED_NAME, + mapKeyParquetType, + mapValueParquetType) + .withId(fieldId); case MULTISET: MultisetType multisetType = (MultisetType) type; DataType elementType = multisetType.getElementType(); @@ -161,15 +189,23 @@ private static Type convertToParquetType( // so we configure it as not nullable elementType = elementType.copy(false); } + Type multisetKeyParquetType = + convertToParquetType(MAP_KEY_NAME, elementType, fieldId, depth + 1) + .withId(SpecialFields.getMapKeyFieldId(fieldId, depth + 1)); + Type multisetValueParquetType = + convertToParquetType(MAP_VALUE_NAME, new IntType(false), fieldId, depth + 1) + .withId(SpecialFields.getMapValueFieldId(fieldId, depth + 1)); return ConversionPatterns.mapType( - repetition, - name, - MAP_REPEATED_NAME, - convertToParquetType(MAP_KEY_NAME, elementType), - convertToParquetType(MAP_VALUE_NAME, new IntType(false))); + repetition, + name, + MAP_REPEATED_NAME, + multisetKeyParquetType, + multisetValueParquetType) + .withId(fieldId); case ROW: RowType rowType = (RowType) type; - return new GroupType(repetition, name, convertToParquetTypes(rowType)); + return new GroupType(repetition, name, convertToParquetTypes(rowType)) + .withId(fieldId); default: throw new UnsupportedOperationException("Unsupported type: " + type); } @@ -194,53 +230,6 @@ private static Type createTimestampWithLogicalType( } } - private static List convertToParquetTypes(RowType rowType) { - List types = new ArrayList<>(rowType.getFieldCount()); - for (DataField field : 
rowType.getFields()) { - Type parquetType = convertToParquetType(field.name(), field.type()); - Type typeWithId = parquetType.withId(field.id()); - if (field.type().getTypeRoot() == DataTypeRoot.ARRAY) { - GroupType groupType = (GroupType) parquetType; - GroupType wrapperType = (GroupType) groupType.getFields().get(0); - Type elementTypeWithId = - wrapperType - .getFields() - .get(0) - .withId(SpecialFields.getArrayElementFieldId(field.id())); - typeWithId = - ConversionPatterns.listOfElements( - groupType.getRepetition(), - groupType.getName(), - elementTypeWithId) - .withId(field.id()); - } else if (field.type().getTypeRoot() == DataTypeRoot.MAP - || field.type().getTypeRoot() == DataTypeRoot.MULTISET) { - GroupType groupType = (GroupType) parquetType; - GroupType wrapperType = (GroupType) groupType.getFields().get(0); - Type keyTypeWithId = - wrapperType - .getFields() - .get(0) - .withId(SpecialFields.getMapKeyFieldId(field.id())); - Type valueTypeWithId = - wrapperType - .getFields() - .get(1) - .withId(SpecialFields.getMapValueFieldId(field.id())); - typeWithId = - ConversionPatterns.mapType( - groupType.getRepetition(), - groupType.getName(), - MAP_REPEATED_NAME, - keyTypeWithId, - valueTypeWithId) - .withId(field.id()); - } - types.add(typeWithId); - } - return types; - } - public static int computeMinBytesForDecimalPrecision(int precision) { int numBytes = 1; while (Math.pow(2.0, 8 * numBytes - 1) < Math.pow(10.0, precision)) { diff --git a/paimon-format/src/test/java/org/apache/paimon/format/parquet/ParquetReadWriteTest.java b/paimon-format/src/test/java/org/apache/paimon/format/parquet/ParquetReadWriteTest.java index 099811d98b528..ffe4d6008296a 100644 --- a/paimon-format/src/test/java/org/apache/paimon/format/parquet/ParquetReadWriteTest.java +++ b/paimon-format/src/test/java/org/apache/paimon/format/parquet/ParquetReadWriteTest.java @@ -97,6 +97,7 @@ import java.util.stream.Collectors; import static org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName.INT32; +import static org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName.INT64; import static org.assertj.core.api.Assertions.assertThat; import static org.assertj.core.api.Assertions.assertThatThrownBy; @@ -489,11 +490,17 @@ public void testConvertToParquetTypeWithId() { new DataField(0, "a", DataTypes.INT()), new DataField(1, "b", DataTypes.ARRAY(DataTypes.STRING())), new DataField( - 2, "c", DataTypes.MAP(DataTypes.INT(), new RowType(nestedFields)))); + 2, + "c", + DataTypes.MAP( + DataTypes.INT(), + DataTypes.MAP( + DataTypes.BIGINT(), new RowType(nestedFields))))); RowType rowType = new RowType(fields); int baseId = 536870911; - Type mapValueType = + int depthLimit = 1 << 10; + Type innerMapValueType = new GroupType( Type.Repetition.OPTIONAL, "value", @@ -506,7 +513,17 @@ public void testConvertToParquetTypeWithId() { .as(LogicalTypeAnnotation.stringType()) .named("v2") .withId(4)) - .withId(baseId - 2); + .withId(baseId + depthLimit * 2 + 2); + Type outerMapValueType = + ConversionPatterns.mapType( + Type.Repetition.OPTIONAL, + "value", + "key_value", + Types.primitive(INT64, Type.Repetition.REQUIRED) + .named("key") + .withId(baseId - depthLimit * 2 - 2), + innerMapValueType) + .withId(baseId + depthLimit * 2 + 1); Type expected = new MessageType( "table", @@ -519,7 +536,7 @@ public void testConvertToParquetTypeWithId() { Type.Repetition.OPTIONAL) .as(LogicalTypeAnnotation.stringType()) .named("element") - .withId(baseId + 1)) + .withId(baseId + depthLimit + 1)) .withId(1), ConversionPatterns.mapType( 
Type.Repetition.OPTIONAL, @@ -527,8 +544,8 @@ public void testConvertToParquetTypeWithId() { "key_value", Types.primitive(INT32, Type.Repetition.REQUIRED) .named("key") - .withId(baseId + 2), - mapValueType) + .withId(baseId - depthLimit * 2 - 1), + outerMapValueType) .withId(2)); Type actual = ParquetSchemaConverter.convertToParquetMessageType("table", rowType); assertThat(actual).isEqualTo(expected); From 19119e3c073619bc5db9ce52c151527af919b8cc Mon Sep 17 00:00:00 2001 From: tsreaper Date: Wed, 13 Nov 2024 16:02:39 +0800 Subject: [PATCH 012/157] [hotfix] Fix compile error in ParquetReaderFactory --- .../org/apache/paimon/format/parquet/ParquetReaderFactory.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java index cede205f4d513..53b4b1634b5fc 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java @@ -104,7 +104,7 @@ public ParquetReaderFactory( } @Override - public RecordReader createReader(FormatReaderFactory.Context context) + public FileRecordReader createReader(FormatReaderFactory.Context context) throws IOException { ParquetReadOptions.Builder builder = ParquetReadOptions.builder().withRange(0, context.fileSize()); From 7eaf30f776b9d1573d86a274ac53633d267262af Mon Sep 17 00:00:00 2001 From: yuzelin <33053040+yuzelin@users.noreply.github.com> Date: Wed, 13 Nov 2024 17:02:55 +0800 Subject: [PATCH 013/157] [common] Fix overflow problem of NumericToBooleanCastRule (#4519) --- .../org/apache/paimon/casting/NumericToBooleanCastRule.java | 2 +- .../test/java/org/apache/paimon/flink/SchemaChangeITCase.java | 3 ++- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/paimon-common/src/main/java/org/apache/paimon/casting/NumericToBooleanCastRule.java b/paimon-common/src/main/java/org/apache/paimon/casting/NumericToBooleanCastRule.java index 06fa89fe35994..5b47741e6d351 100644 --- a/paimon-common/src/main/java/org/apache/paimon/casting/NumericToBooleanCastRule.java +++ b/paimon-common/src/main/java/org/apache/paimon/casting/NumericToBooleanCastRule.java @@ -37,6 +37,6 @@ private NumericToBooleanCastRule() { @Override public CastExecutor create(DataType inputType, DataType targetType) { - return value -> value.intValue() != 0; + return value -> value.longValue() != 0; } } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java index ba161fe84008f..a2ef1d5c8acec 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java @@ -251,7 +251,8 @@ public void testModifyColumnTypeFromNumericToDecimal() { public void testModifyColumnTypeBooleanAndNumeric() { // boolean To numeric and numeric To boolean sql("CREATE TABLE T (a BOOLEAN, b BOOLEAN, c TINYINT, d INT, e BIGINT, f DOUBLE)"); - sql("INSERT INTO T VALUES(true, false, cast(0 as TINYINT), 1 , 123, 3.14)"); + sql( + "INSERT INTO T VALUES(true, false, cast(0 as TINYINT), 1 , -9223372036854775808, 3.14)"); sql("ALTER TABLE T MODIFY (a TINYINT, b INT, c BOOLEAN, d BOOLEAN, e BOOLEAN)"); List result = sql("SHOW CREATE TABLE 
T"); From 30bf5036d6117aedce7297dacec23155a7d5778c Mon Sep 17 00:00:00 2001 From: "liming.1018" Date: Wed, 13 Nov 2024 17:04:39 +0800 Subject: [PATCH 014/157] [flink] support multiple writers writing to the same partition when using kafka as logSystem in unaware bucket mode. (#4516) --- .../apache/paimon/manifest/ManifestCommittable.java | 7 ++++--- .../src/test/java/org/apache/paimon/TestFileStore.java | 3 ++- .../manifest/ManifestCommittableSerializerTest.java | 2 +- .../org/apache/paimon/flink/sink/StoreCommitter.java | 10 +++++++++- .../apache/paimon/flink/sink/StoreMultiCommitter.java | 10 ++++++---- .../sink/WrappedManifestCommittableSerializerTest.java | 2 +- 6 files changed, 23 insertions(+), 11 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/manifest/ManifestCommittable.java b/paimon-core/src/main/java/org/apache/paimon/manifest/ManifestCommittable.java index 61c4619bd6d6a..b4abd0e9ec0ed 100644 --- a/paimon-core/src/main/java/org/apache/paimon/manifest/ManifestCommittable.java +++ b/paimon-core/src/main/java/org/apache/paimon/manifest/ManifestCommittable.java @@ -62,13 +62,14 @@ public void addFileCommittable(CommitMessage commitMessage) { commitMessages.add(commitMessage); } - public void addLogOffset(int bucket, long offset) { - if (logOffsets.containsKey(bucket)) { + public void addLogOffset(int bucket, long offset, boolean allowDuplicate) { + if (!allowDuplicate && logOffsets.containsKey(bucket)) { throw new RuntimeException( String.format( "bucket-%d appears multiple times, which is not possible.", bucket)); } - logOffsets.put(bucket, offset); + long newOffset = Math.max(logOffsets.getOrDefault(bucket, offset), offset); + logOffsets.put(bucket, newOffset); } public long identifier() { diff --git a/paimon-core/src/test/java/org/apache/paimon/TestFileStore.java b/paimon-core/src/test/java/org/apache/paimon/TestFileStore.java index 303879337780f..5218a515a3374 100644 --- a/paimon-core/src/test/java/org/apache/paimon/TestFileStore.java +++ b/paimon-core/src/test/java/org/apache/paimon/TestFileStore.java @@ -222,7 +222,8 @@ public List commitData( null, Collections.emptyList(), (commit, committable) -> { - logOffsets.forEach(committable::addLogOffset); + logOffsets.forEach( + (bucket, offset) -> committable.addLogOffset(bucket, offset, false)); commit.commit(committable, Collections.emptyMap()); }); } diff --git a/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestCommittableSerializerTest.java b/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestCommittableSerializerTest.java index c179a2c0a789f..8de8309bc8fbb 100644 --- a/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestCommittableSerializerTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestCommittableSerializerTest.java @@ -83,7 +83,7 @@ private static void addFileCommittables( if (!committable.logOffsets().containsKey(bucket)) { int offset = ID.incrementAndGet(); - committable.addLogOffset(bucket, offset); + committable.addLogOffset(bucket, offset, false); assertThat(committable.logOffsets().get(bucket)).isEqualTo(offset); } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCommitter.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCommitter.java index d237f4da56cf7..4908b99317bae 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCommitter.java +++ 
b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCommitter.java @@ -23,6 +23,7 @@ import org.apache.paimon.flink.sink.partition.PartitionListeners; import org.apache.paimon.io.DataFileMeta; import org.apache.paimon.manifest.ManifestCommittable; +import org.apache.paimon.table.BucketMode; import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.sink.CommitMessage; import org.apache.paimon.table.sink.CommitMessageImpl; @@ -44,6 +45,7 @@ public class StoreCommitter implements Committer committables) { if (committerMetrics == null) { return; diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreMultiCommitter.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreMultiCommitter.java index aeb3e1857b9b7..537a98f97fb03 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreMultiCommitter.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreMultiCommitter.java @@ -92,11 +92,11 @@ public WrappedManifestCommittable combine( WrappedManifestCommittable wrappedManifestCommittable, List committables) { for (MultiTableCommittable committable : committables) { + Identifier identifier = + Identifier.create(committable.getDatabase(), committable.getTable()); ManifestCommittable manifestCommittable = wrappedManifestCommittable.computeCommittableIfAbsent( - Identifier.create(committable.getDatabase(), committable.getTable()), - checkpointId, - watermark); + identifier, checkpointId, watermark); switch (committable.kind()) { case FILE: @@ -106,7 +106,9 @@ public WrappedManifestCommittable combine( case LOG_OFFSET: LogOffsetCommittable offset = (LogOffsetCommittable) committable.wrappedCommittable(); - manifestCommittable.addLogOffset(offset.bucket(), offset.offset()); + StoreCommitter committer = tableCommitters.get(identifier); + manifestCommittable.addLogOffset( + offset.bucket(), offset.offset(), committer.allowLogOffsetDuplicate()); break; } } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WrappedManifestCommittableSerializerTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WrappedManifestCommittableSerializerTest.java index 298f3155ba34e..b0aa76f157ac8 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WrappedManifestCommittableSerializerTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WrappedManifestCommittableSerializerTest.java @@ -98,7 +98,7 @@ public static void addFileCommittables( if (!committable.logOffsets().containsKey(bucket)) { int offset = ID.incrementAndGet(); - committable.addLogOffset(bucket, offset); + committable.addLogOffset(bucket, offset, false); assertThat(committable.logOffsets().get(bucket)).isEqualTo(offset); } } From c7dfcfa18411af1511035b1481229499008eda05 Mon Sep 17 00:00:00 2001 From: zhangdong Date: Wed, 13 Nov 2024 17:05:24 +0800 Subject: [PATCH 015/157] [core] Partitions system table support time travel (#4511) --- .../paimon/table/system/PartitionsTable.java | 2 +- .../table/system/PartitionsTableTest.java | 24 ++++++++++++++++--- 2 files changed, 22 insertions(+), 4 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/PartitionsTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/PartitionsTable.java index 736347b9aff3e..7e0b1f1d75682 100644 --- 
a/paimon-core/src/main/java/org/apache/paimon/table/system/PartitionsTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/PartitionsTable.java @@ -178,7 +178,7 @@ public RecordReader createReader(Split split) throws IOException { throw new IllegalArgumentException("Unsupported split: " + split.getClass()); } - List partitions = fileStoreTable.newSnapshotReader().partitionEntries(); + List partitions = fileStoreTable.newScan().listPartitionEntries(); RowDataToObjectArrayConverter converter = new RowDataToObjectArrayConverter( diff --git a/paimon-core/src/test/java/org/apache/paimon/table/system/PartitionsTableTest.java b/paimon-core/src/test/java/org/apache/paimon/table/system/PartitionsTableTest.java index a17dc75466a68..8d12dc707bf5d 100644 --- a/paimon-core/src/test/java/org/apache/paimon/table/system/PartitionsTableTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/table/system/PartitionsTableTest.java @@ -40,6 +40,7 @@ import org.junit.jupiter.api.Test; import java.util.ArrayList; +import java.util.Collections; import java.util.List; import static org.assertj.core.api.Assertions.assertThat; @@ -76,7 +77,7 @@ public void before() throws Exception { partitionsTable = (PartitionsTable) catalog.getTable(filesTableId); // snapshot 1: append - write(table, GenericRow.of(1, 1, 1), GenericRow.of(1, 2, 5)); + write(table, GenericRow.of(1, 1, 1), GenericRow.of(1, 3, 5)); write(table, GenericRow.of(1, 1, 3), GenericRow.of(1, 2, 4)); } @@ -85,19 +86,36 @@ public void before() throws Exception { public void testPartitionRecordCount() throws Exception { List expectedRow = new ArrayList<>(); expectedRow.add(GenericRow.of(BinaryString.fromString("[1]"), 2L)); - expectedRow.add(GenericRow.of(BinaryString.fromString("[2]"), 2L)); + expectedRow.add(GenericRow.of(BinaryString.fromString("[2]"), 1L)); + expectedRow.add(GenericRow.of(BinaryString.fromString("[3]"), 1L)); // Only read partition and record count, record size may not stable. List result = read(partitionsTable, new int[][] {{0}, {1}}); assertThat(result).containsExactlyInAnyOrderElementsOf(expectedRow); } + @Test + public void testPartitionTimeTravel() throws Exception { + List expectedRow = new ArrayList<>(); + expectedRow.add(GenericRow.of(BinaryString.fromString("[1]"), 1L)); + expectedRow.add(GenericRow.of(BinaryString.fromString("[3]"), 1L)); + + // Only read partition and record count, record size may not stable. + List result = + read( + partitionsTable.copy( + Collections.singletonMap(CoreOptions.SCAN_VERSION.key(), "1")), + new int[][] {{0}, {1}}); + assertThat(result).containsExactlyInAnyOrderElementsOf(expectedRow); + } + @Test public void testPartitionValue() throws Exception { write(table, GenericRow.of(2, 1, 3), GenericRow.of(3, 1, 4)); List expectedRow = new ArrayList<>(); expectedRow.add(GenericRow.of(BinaryString.fromString("[1]"), 4L, 3L)); - expectedRow.add(GenericRow.of(BinaryString.fromString("[2]"), 2L, 2L)); + expectedRow.add(GenericRow.of(BinaryString.fromString("[2]"), 1L, 1L)); + expectedRow.add(GenericRow.of(BinaryString.fromString("[3]"), 1L, 1L)); List result = read(partitionsTable, new int[][] {{0}, {1}, {3}}); assertThat(result).containsExactlyInAnyOrderElementsOf(expectedRow); From c95c3e6f9132dc89fd39cf0427d9b5fba544476c Mon Sep 17 00:00:00 2001 From: "liming.1018" Date: Thu, 14 Nov 2024 10:57:02 +0800 Subject: [PATCH 016/157] [core] supports using dynamic parameters to query the system table of a specified branch. 
(#4527) --- .../table/system/AggregationFieldsTable.java | 18 +++---- .../paimon/table/system/BranchesTable.java | 13 +++-- .../paimon/table/system/ConsumersTable.java | 18 +++---- .../paimon/table/system/OptionsTable.java | 18 +++---- .../paimon/table/system/SchemasTable.java | 18 +++---- .../paimon/table/system/SnapshotsTable.java | 17 ++---- .../apache/paimon/table/system/TagsTable.java | 18 +++---- .../apache/paimon/flink/BranchSqlITCase.java | 52 +++++++++++++++++++ 8 files changed, 97 insertions(+), 75 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/AggregationFieldsTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/AggregationFieldsTable.java index a88bde9e5d720..10a046ca70b52 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/AggregationFieldsTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/AggregationFieldsTable.java @@ -80,17 +80,13 @@ public class AggregationFieldsTable implements ReadonlyTable { private final Path location; private final String branch; - public AggregationFieldsTable(FileStoreTable dataTable) { - this( - dataTable.fileIO(), - dataTable.location(), - CoreOptions.branch(dataTable.schema().options())); - } + private final FileStoreTable dataTable; - public AggregationFieldsTable(FileIO fileIO, Path location, String branchName) { - this.fileIO = fileIO; - this.location = location; - this.branch = branchName; + public AggregationFieldsTable(FileStoreTable dataTable) { + this.fileIO = dataTable.fileIO(); + this.location = dataTable.location(); + this.branch = CoreOptions.branch(dataTable.schema().options()); + this.dataTable = dataTable; } @Override @@ -120,7 +116,7 @@ public InnerTableRead newRead() { @Override public Table copy(Map dynamicOptions) { - return new AggregationFieldsTable(fileIO, location, branch); + return new AggregationFieldsTable(dataTable.copy(dynamicOptions)); } private class SchemasScan extends ReadOnceTableScan { diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/BranchesTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/BranchesTable.java index f523f20e9d200..384a2eee92c82 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/BranchesTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/BranchesTable.java @@ -81,13 +81,12 @@ public class BranchesTable implements ReadonlyTable { private final FileIO fileIO; private final Path location; - public BranchesTable(FileStoreTable dataTable) { - this(dataTable.fileIO(), dataTable.location()); - } + private final FileStoreTable dataTable; - public BranchesTable(FileIO fileIO, Path location) { - this.fileIO = fileIO; - this.location = location; + public BranchesTable(FileStoreTable dataTable) { + this.fileIO = dataTable.fileIO(); + this.location = dataTable.location(); + this.dataTable = dataTable; } @Override @@ -117,7 +116,7 @@ public InnerTableRead newRead() { @Override public Table copy(Map dynamicOptions) { - return new BranchesTable(fileIO, location); + return new BranchesTable(dataTable.copy(dynamicOptions)); } private class BranchesScan extends ReadOnceTableScan { diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/ConsumersTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/ConsumersTable.java index 9f7d12961e2f1..7e4816b13510b 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/ConsumersTable.java +++ 
b/paimon-core/src/main/java/org/apache/paimon/table/system/ConsumersTable.java @@ -74,17 +74,13 @@ public class ConsumersTable implements ReadonlyTable { private final Path location; private final String branch; - public ConsumersTable(FileStoreTable dataTable) { - this( - dataTable.fileIO(), - dataTable.location(), - CoreOptions.branch(dataTable.schema().options())); - } + private final FileStoreTable dataTable; - public ConsumersTable(FileIO fileIO, Path location, String branchName) { - this.fileIO = fileIO; - this.location = location; - this.branch = branchName; + public ConsumersTable(FileStoreTable dataTable) { + this.fileIO = dataTable.fileIO(); + this.location = dataTable.location(); + this.branch = CoreOptions.branch(dataTable.schema().options()); + this.dataTable = dataTable; } @Override @@ -114,7 +110,7 @@ public InnerTableRead newRead() { @Override public Table copy(Map dynamicOptions) { - return new ConsumersTable(fileIO, location, branch); + return new ConsumersTable(dataTable.copy(dynamicOptions)); } private class ConsumersScan extends ReadOnceTableScan { diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/OptionsTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/OptionsTable.java index b4a3b82a2f5f7..c7dec03343d09 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/OptionsTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/OptionsTable.java @@ -72,17 +72,13 @@ public class OptionsTable implements ReadonlyTable { private final Path location; private final String branch; - public OptionsTable(FileStoreTable dataTable) { - this( - dataTable.fileIO(), - dataTable.location(), - CoreOptions.branch(dataTable.schema().options())); - } + private final FileStoreTable dataTable; - public OptionsTable(FileIO fileIO, Path location, String branchName) { - this.fileIO = fileIO; - this.location = location; - this.branch = branchName; + public OptionsTable(FileStoreTable dataTable) { + this.fileIO = dataTable.fileIO(); + this.location = dataTable.location(); + this.branch = CoreOptions.branch(dataTable.schema().options()); + this.dataTable = dataTable; } @Override @@ -112,7 +108,7 @@ public InnerTableRead newRead() { @Override public Table copy(Map dynamicOptions) { - return new OptionsTable(fileIO, location, branch); + return new OptionsTable(dataTable.copy(dynamicOptions)); } private class OptionsScan extends ReadOnceTableScan { diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/SchemasTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/SchemasTable.java index 86e2598c609cf..d0df75b34f512 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/SchemasTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/SchemasTable.java @@ -102,17 +102,13 @@ public class SchemasTable implements ReadonlyTable { private final Path location; private final String branch; - public SchemasTable(FileStoreTable dataTable) { - this( - dataTable.fileIO(), - dataTable.location(), - CoreOptions.branch(dataTable.schema().options())); - } + private final FileStoreTable dataTable; - public SchemasTable(FileIO fileIO, Path location, String branchName) { - this.fileIO = fileIO; - this.location = location; - this.branch = branchName; + public SchemasTable(FileStoreTable dataTable) { + this.fileIO = dataTable.fileIO(); + this.location = dataTable.location(); + this.branch = CoreOptions.branch(dataTable.schema().options()); + this.dataTable = dataTable; } @Override @@ -142,7 
+138,7 @@ public InnerTableRead newRead() { @Override public Table copy(Map dynamicOptions) { - return new SchemasTable(fileIO, location, branch); + return new SchemasTable(dataTable.copy(dynamicOptions)); } private class SchemasScan extends ReadOnceTableScan { diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/SnapshotsTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/SnapshotsTable.java index a958432194400..10e5b691acc32 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/SnapshotsTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/SnapshotsTable.java @@ -116,19 +116,10 @@ public class SnapshotsTable implements ReadonlyTable { private final FileStoreTable dataTable; public SnapshotsTable(FileStoreTable dataTable) { - this( - dataTable.fileIO(), - dataTable.location(), - dataTable, - CoreOptions.branch(dataTable.schema().options())); - } - - public SnapshotsTable( - FileIO fileIO, Path location, FileStoreTable dataTable, String branchName) { - this.fileIO = fileIO; - this.location = location; + this.fileIO = dataTable.fileIO(); + this.location = dataTable.location(); + this.branch = CoreOptions.branch(dataTable.schema().options()); this.dataTable = dataTable; - this.branch = branchName; } @Override @@ -158,7 +149,7 @@ public InnerTableRead newRead() { @Override public Table copy(Map dynamicOptions) { - return new SnapshotsTable(fileIO, location, dataTable.copy(dynamicOptions), branch); + return new SnapshotsTable(dataTable.copy(dynamicOptions)); } private class SnapshotsScan extends ReadOnceTableScan { diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/TagsTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/TagsTable.java index 4d1b4e22ab189..9aafdb5983fd5 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/TagsTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/TagsTable.java @@ -95,17 +95,13 @@ public class TagsTable implements ReadonlyTable { private final Path location; private final String branch; - public TagsTable(FileStoreTable dataTable) { - this( - dataTable.fileIO(), - dataTable.location(), - CoreOptions.branch(dataTable.schema().options())); - } + private final FileStoreTable dataTable; - public TagsTable(FileIO fileIO, Path location, String branchName) { - this.fileIO = fileIO; - this.location = location; - this.branch = branchName; + public TagsTable(FileStoreTable dataTable) { + this.fileIO = dataTable.fileIO(); + this.location = dataTable.location(); + this.branch = CoreOptions.branch(dataTable.schema().options()); + this.dataTable = dataTable; } @Override @@ -135,7 +131,7 @@ public InnerTableRead newRead() { @Override public Table copy(Map dynamicOptions) { - return new TagsTable(fileIO, location, branch); + return new TagsTable(dataTable.copy(dynamicOptions)); } private class TagsScan extends ReadOnceTableScan { diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/BranchSqlITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/BranchSqlITCase.java index 1d33a9e8a6f25..c25d99cb44591 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/BranchSqlITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/BranchSqlITCase.java @@ -347,6 +347,11 @@ public void testBranchOptionsTable() throws Exception { "+I[bucket, 2]", "+I[snapshot.time-retained, 1 h]", "+I[scan.infer-parallelism, false]"); + 
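        // With the system tables now delegating copy(dynamicOptions) to the wrapped
        // FileStoreTable, the 'branch' option can also be supplied as a dynamic table hint,
        // as the new assertion below checks.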
assertThat(collectResult("SELECT * FROM t$options /*+ OPTIONS('branch'='test') */")) + .containsExactlyInAnyOrder( + "+I[bucket, 2]", + "+I[snapshot.time-retained, 1 h]", + "+I[scan.infer-parallelism, false]"); } @Test @@ -360,6 +365,10 @@ public void testBranchSchemasTable() throws Exception { sql("ALTER TABLE t$branch_b1 SET ('snapshot.time-retained' = '5 h')"); assertThat(collectResult("SELECT schema_id FROM t$branch_b1$schemas order by schema_id")) .containsExactlyInAnyOrder("+I[0]", "+I[1]"); + assertThat( + collectResult( + "SELECT schema_id FROM t$schemas /*+ OPTIONS('branch'='b1') */ order by schema_id")) + .containsExactlyInAnyOrder("+I[0]", "+I[1]"); } @Test @@ -373,6 +382,8 @@ public void testBranchAuditLogTable() throws Exception { sql("INSERT INTO t$branch_b1 VALUES (3, 4)"); assertThat(collectResult("SELECT * FROM t$branch_b1$audit_log")) .containsExactlyInAnyOrder("+I[+I, 3, 4]"); + assertThat(collectResult("SELECT * FROM t$audit_log /*+ OPTIONS('branch'='b1') */")) + .containsExactlyInAnyOrder("+I[+I, 3, 4]"); } @Test @@ -385,6 +396,8 @@ public void testBranchReadOptimizedTable() throws Exception { sql("INSERT INTO t$branch_b1 VALUES (3, 4)"); assertThat(collectResult("SELECT * FROM t$branch_b1$ro")) .containsExactlyInAnyOrder("+I[3, 4]"); + assertThat(collectResult("SELECT * FROM t$ro /*+ OPTIONS('branch'='b1') */")) + .containsExactlyInAnyOrder("+I[3, 4]"); } @Test @@ -400,6 +413,10 @@ public void testBranchFilesTable() throws Exception { .containsExactlyInAnyOrder("+I[{a=1, b=2}]"); assertThat(collectResult("SELECT min_value_stats FROM t$branch_b1$files")) .containsExactlyInAnyOrder("+I[{a=3, b=4}]", "+I[{a=5, b=6}]"); + assertThat( + collectResult( + "SELECT min_value_stats FROM t$files /*+ OPTIONS('branch'='b1') */")) + .containsExactlyInAnyOrder("+I[{a=3, b=4}]", "+I[{a=5, b=6}]"); } @Test @@ -416,6 +433,10 @@ public void testBranchTagsTable() throws Exception { .containsExactlyInAnyOrder("+I[tag1, 1, 1]"); assertThat(collectResult("SELECT tag_name,snapshot_id,record_count FROM t$branch_b1$tags")) .containsExactlyInAnyOrder("+I[tag1, 1, 1]", "+I[tag2, 2, 2]"); + assertThat( + collectResult( + "SELECT tag_name,snapshot_id,record_count FROM t$tags /*+ OPTIONS('branch'='b1') */")) + .containsExactlyInAnyOrder("+I[tag1, 1, 1]", "+I[tag2, 2, 2]"); } @Test @@ -435,6 +456,8 @@ public void testBranchConsumersTable() throws Exception { assertThat(collectResult("SELECT * FROM t$consumers")).isEmpty(); assertThat(collectResult("SELECT * FROM t$branch_b1$consumers")) .containsExactlyInAnyOrder("+I[id1, 2]"); + assertThat(collectResult("SELECT * FROM t$consumers /*+ OPTIONS('branch'='b1') */")) + .containsExactlyInAnyOrder("+I[id1, 2]"); } @Test @@ -458,6 +481,31 @@ public void testBranchManifestsTable() { .isTrue(); assertThat((long) row.getField(2)).isGreaterThan(0L); }); + List dynamicOptionRes = + sql( + "SELECT schema_id, file_name, file_size FROM t$manifests /*+ OPTIONS('branch'='b1') */"); + assertThat(dynamicOptionRes).containsExactlyInAnyOrderElementsOf(res); + } + + @Test + public void testBranchSnapshotsTable() throws Exception { + sql("CREATE TABLE t (a INT, b INT)"); + sql("INSERT INTO t VALUES (1, 2)"); + + sql("CALL sys.create_branch('default.t', 'b1')"); + sql("INSERT INTO t$branch_b1 VALUES (3, 4)"); + sql("INSERT INTO t$branch_b1 VALUES (5, 6)"); + + assertThat(collectResult("SELECT snapshot_id, schema_id, commit_kind FROM t$snapshots")) + .containsExactlyInAnyOrder("+I[1, 0, APPEND]"); + assertThat( + collectResult( + "SELECT snapshot_id, schema_id, commit_kind 
FROM t$branch_b1$snapshots")) + .containsExactlyInAnyOrder("+I[1, 0, APPEND]", "+I[2, 0, APPEND]"); + assertThat( + collectResult( + "SELECT snapshot_id, schema_id, commit_kind FROM t$snapshots /*+ OPTIONS('branch'='b1') */")) + .containsExactlyInAnyOrder("+I[1, 0, APPEND]", "+I[2, 0, APPEND]"); } @Test @@ -479,6 +527,10 @@ public void testBranchPartitionsTable() throws Exception { collectResult( "SELECT `partition`, record_count, file_count FROM t$branch_b1$partitions")) .containsExactlyInAnyOrder("+I[[1], 2, 2]", "+I[[2], 3, 2]"); + assertThat( + collectResult( + "SELECT `partition`, record_count, file_count FROM t$partitions /*+ OPTIONS('branch'='b1') */")) + .containsExactlyInAnyOrder("+I[[1], 2, 2]", "+I[[2], 3, 2]"); } @Test From 84a97ee952365c0cdbcf816c2caefc5003ec1ee7 Mon Sep 17 00:00:00 2001 From: Yubin Li Date: Thu, 14 Nov 2024 11:05:12 +0800 Subject: [PATCH 017/157] [core] Support deleting rows in partial update of specific sequence group (#4525) --- .../merge-engine/partial-update.md | 3 +- .../generated/core_configuration.html | 6 ++ .../java/org/apache/paimon/CoreOptions.java | 8 ++ .../compact/PartialUpdateMergeFunction.java | 47 +++++++++-- .../PartialUpdateMergeFunctionTest.java | 36 ++++++++ .../table/PrimaryKeyFileStoreTableTest.java | 84 +++++++++++++++++++ 6 files changed, 178 insertions(+), 6 deletions(-) diff --git a/docs/content/primary-key-table/merge-engine/partial-update.md b/docs/content/primary-key-table/merge-engine/partial-update.md index 83b664c1bc7f5..d664694e96652 100644 --- a/docs/content/primary-key-table/merge-engine/partial-update.md +++ b/docs/content/primary-key-table/merge-engine/partial-update.md @@ -51,7 +51,8 @@ By default, Partial update can not accept delete records, you can choose one of - Configure 'ignore-delete' to ignore delete records. - Configure 'partial-update.remove-record-on-delete' to remove the whole row when receiving delete records. - Configure 'sequence-group's to retract partial columns. - {{< /hint >}} + * Configure 'partial-update.remove-record-on-sequence-group' to remove the whole row when receiving delete records of specified sequence group. +{{< /hint >}} ## Sequence Group diff --git a/docs/layouts/shortcodes/generated/core_configuration.html b/docs/layouts/shortcodes/generated/core_configuration.html index 7287cacc2c53e..3efeaeb3e8a9a 100644 --- a/docs/layouts/shortcodes/generated/core_configuration.html +++ b/docs/layouts/shortcodes/generated/core_configuration.html @@ -557,6 +557,12 @@ Boolean Whether to remove the whole row in partial-update engine when -D records are received. + +
partial-update.remove-record-on-sequence-group
+ (none) + String + Whether to remove the whole row in partial-update engine when -D records of specified sequence group are received. +
partition
(none) diff --git a/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java b/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java index db603c5b61f06..9875e2fac45f2 100644 --- a/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java +++ b/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java @@ -631,6 +631,14 @@ public class CoreOptions implements Serializable { .withDescription( "Whether to remove the whole row in partial-update engine when -D records are received."); + @Immutable + public static final ConfigOption PARTIAL_UPDATE_REMOVE_RECORD_ON_SEQUENCE_GROUP = + key("partial-update.remove-record-on-sequence-group") + .stringType() + .noDefaultValue() + .withDescription( + "Whether to remove the whole row in partial-update engine when -D records of specified sequence group are received."); + @Immutable public static final ConfigOption ROWKIND_FIELD = key("rowkind.field") diff --git a/paimon-core/src/main/java/org/apache/paimon/mergetree/compact/PartialUpdateMergeFunction.java b/paimon-core/src/main/java/org/apache/paimon/mergetree/compact/PartialUpdateMergeFunction.java index 4d720cb3f0750..ab25794129baf 100644 --- a/paimon-core/src/main/java/org/apache/paimon/mergetree/compact/PartialUpdateMergeFunction.java +++ b/paimon-core/src/main/java/org/apache/paimon/mergetree/compact/PartialUpdateMergeFunction.java @@ -52,6 +52,7 @@ import static org.apache.paimon.CoreOptions.FIELDS_PREFIX; import static org.apache.paimon.CoreOptions.FIELDS_SEPARATOR; import static org.apache.paimon.CoreOptions.PARTIAL_UPDATE_REMOVE_RECORD_ON_DELETE; +import static org.apache.paimon.CoreOptions.PARTIAL_UPDATE_REMOVE_RECORD_ON_SEQUENCE_GROUP; import static org.apache.paimon.utils.InternalRowUtils.createFieldGetters; /** @@ -68,6 +69,7 @@ public class PartialUpdateMergeFunction implements MergeFunction { private final boolean fieldSequenceEnabled; private final Map fieldAggregators; private final boolean removeRecordOnDelete; + private final Set sequenceGroupPartialDelete; private InternalRow currentKey; private long latestSequenceNumber; @@ -81,13 +83,15 @@ protected PartialUpdateMergeFunction( Map fieldSeqComparators, Map fieldAggregators, boolean fieldSequenceEnabled, - boolean removeRecordOnDelete) { + boolean removeRecordOnDelete, + Set sequenceGroupPartialDelete) { this.getters = getters; this.ignoreDelete = ignoreDelete; this.fieldSeqComparators = fieldSeqComparators; this.fieldAggregators = fieldAggregators; this.fieldSequenceEnabled = fieldSequenceEnabled; this.removeRecordOnDelete = removeRecordOnDelete; + this.sequenceGroupPartialDelete = sequenceGroupPartialDelete; } @Override @@ -220,8 +224,15 @@ private void retractWithSequenceGroup(KeyValue kv) { .anyMatch(field -> field == index)) { for (int field : seqComparator.compareFields()) { if (!updatedSequenceFields.contains(field)) { - row.setField(field, getters[field].getFieldOrNull(kv.value())); - updatedSequenceFields.add(field); + if (kv.valueKind() == RowKind.DELETE + && sequenceGroupPartialDelete.contains(field)) { + currentDeleteRow = true; + row = new GenericRow(getters.length); + return; + } else { + row.setField(field, getters[field].getFieldOrNull(kv.value())); + updatedSequenceFields.add(field); + } } } } else { @@ -278,13 +289,21 @@ private static class Factory implements MergeFunctionFactory { private final boolean removeRecordOnDelete; + private final String removeRecordOnSequenceGroup; + + private Set sequenceGroupPartialDelete; + private Factory(Options options, RowType rowType, List primaryKeys) { 
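            // The constructor parses each 'fields.<seq-field>.sequence-group' option and then
            // validates 'partial-update.remove-record-on-sequence-group': every field named there
            // must itself be a sequence field defining a group; its index is collected into
            // sequenceGroupPartialDelete so that a -D record winning that group drops the whole
            // row instead of only retracting its columns.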
this.ignoreDelete = options.get(CoreOptions.IGNORE_DELETE); this.rowType = rowType; this.tableTypes = rowType.getFieldTypes(); + this.removeRecordOnSequenceGroup = + options.get(PARTIAL_UPDATE_REMOVE_RECORD_ON_SEQUENCE_GROUP); + this.sequenceGroupPartialDelete = new HashSet<>(); List fieldNames = rowType.getFieldNames(); this.fieldSeqComparators = new HashMap<>(); + Map sequenceGroupMap = new HashMap<>(); for (Map.Entry entry : options.toMap().entrySet()) { String k = entry.getKey(); String v = entry.getValue(); @@ -323,6 +342,7 @@ private Factory(Options options, RowType rowType, List primaryKeys) { fieldName -> { int index = fieldNames.indexOf(fieldName); fieldSeqComparators.put(index, userDefinedSeqComparator); + sequenceGroupMap.put(fieldName, index); }); } } @@ -345,6 +365,21 @@ private Factory(Options options, RowType rowType, List primaryKeys) { String.format( "sequence group and %s have conflicting behavior so should not be enabled at the same time.", PARTIAL_UPDATE_REMOVE_RECORD_ON_DELETE)); + + if (removeRecordOnSequenceGroup != null) { + String[] sequenceGroupArr = removeRecordOnSequenceGroup.split(FIELDS_SEPARATOR); + Preconditions.checkState( + sequenceGroupMap.keySet().containsAll(Arrays.asList(sequenceGroupArr)), + String.format( + "field '%s' defined in '%s' option must be part of sequence groups", + removeRecordOnSequenceGroup, + PARTIAL_UPDATE_REMOVE_RECORD_ON_SEQUENCE_GROUP.key())); + sequenceGroupPartialDelete = + Arrays.stream(sequenceGroupArr) + .filter(sequenceGroupMap::containsKey) + .map(sequenceGroupMap::get) + .collect(Collectors.toSet()); + } } @Override @@ -405,7 +440,8 @@ public MergeFunction create(@Nullable int[][] projection) { projectedSeqComparators, projectedAggregators, !fieldSeqComparators.isEmpty(), - removeRecordOnDelete); + removeRecordOnDelete, + sequenceGroupPartialDelete); } else { Map fieldSeqComparators = new HashMap<>(); this.fieldSeqComparators.forEach( @@ -419,7 +455,8 @@ public MergeFunction create(@Nullable int[][] projection) { fieldSeqComparators, fieldAggregators, !fieldSeqComparators.isEmpty(), - removeRecordOnDelete); + removeRecordOnDelete, + sequenceGroupPartialDelete); } } diff --git a/paimon-core/src/test/java/org/apache/paimon/mergetree/compact/PartialUpdateMergeFunctionTest.java b/paimon-core/src/test/java/org/apache/paimon/mergetree/compact/PartialUpdateMergeFunctionTest.java index a6e1b5f90fe23..93f634944e6e8 100644 --- a/paimon-core/src/test/java/org/apache/paimon/mergetree/compact/PartialUpdateMergeFunctionTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/mergetree/compact/PartialUpdateMergeFunctionTest.java @@ -95,6 +95,42 @@ public void testSequenceGroup() { validate(func, 1, null, null, 6, null, null, 6); } + @Test + public void testSequenceGroupPartialDelete() { + Options options = new Options(); + options.set("fields.f3.sequence-group", "f1,f2"); + options.set("fields.f6.sequence-group", "f4,f5"); + options.set("partial-update.remove-record-on-sequence-group", "f6"); + RowType rowType = + RowType.of( + DataTypes.INT(), + DataTypes.INT(), + DataTypes.INT(), + DataTypes.INT(), + DataTypes.INT(), + DataTypes.INT(), + DataTypes.INT()); + MergeFunction func = + PartialUpdateMergeFunction.factory(options, rowType, ImmutableList.of("f0")) + .create(); + func.reset(); + add(func, 1, 1, 1, 1, 1, 1, 1); + add(func, 1, 2, 2, 2, 2, 2, null); + validate(func, 1, 2, 2, 2, 1, 1, 1); + add(func, 1, 3, 3, 1, 3, 3, 3); + validate(func, 1, 2, 2, 2, 3, 3, 3); + + // delete + add(func, RowKind.DELETE, 1, 1, 1, 3, 1, 1, null); + 
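        // The -D record above only won the f3 sequence group (3 > 2), so f1/f2 are retracted to
        // null while the f6 group keeps its values and the row itself survives; the expectation
        // below reflects that. The next -D record also wins the f6 group (4 > 3), and because f6
        // is listed in 'partial-update.remove-record-on-sequence-group' the whole row is removed.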
validate(func, 1, null, null, 3, 3, 3, 3); + add(func, RowKind.DELETE, 1, 1, 1, 3, 1, 1, 4); + validate(func, null, null, null, null, null, null, null); + add(func, 1, 4, 4, 4, 5, 5, 5); + validate(func, 1, 4, 4, 4, 5, 5, 5); + add(func, RowKind.DELETE, 1, 1, 1, 6, 1, 1, 6); + validate(func, null, null, null, null, null, null, null); + } + @Test public void testMultiSequenceFields() { Options options = new Options(); diff --git a/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java b/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java index 4917d076014a9..133913c487cdf 100644 --- a/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java @@ -1213,6 +1213,90 @@ public void testPartialUpdateRemoveRecordOnDelete() throws Exception { commit.close(); } + @Test + public void testPartialUpdateRemoveRecordOnSequenceGroup() throws Exception { + RowType rowType = + RowType.of( + new DataType[] { + DataTypes.INT(), + DataTypes.INT(), + DataTypes.INT(), + DataTypes.INT(), + DataTypes.INT(), + DataTypes.INT(), + DataTypes.INT() + }, + new String[] {"pt", "a", "b", "seq1", "c", "d", "seq2"}); + FileStoreTable table = + createFileStoreTable( + options -> { + options.set("merge-engine", "partial-update"); + options.set("fields.seq1.sequence-group", "b"); + options.set("fields.seq2.sequence-group", "c,d"); + options.set("partial-update.remove-record-on-sequence-group", "seq2"); + }, + rowType); + FileStoreTable wrongTable = + createFileStoreTable( + options -> { + options.set("merge-engine", "partial-update"); + options.set("fields.seq1.sequence-group", "b"); + options.set("fields.seq2.sequence-group", "c,d"); + options.set("partial-update.remove-record-on-sequence-group", "b"); + }, + rowType); + Function rowToString = row -> internalRowToString(row, rowType); + + assertThatThrownBy(() -> wrongTable.newWrite("")) + .hasMessageContaining( + "field 'b' defined in 'partial-update.remove-record-on-sequence-group' option must be part of sequence groups"); + + SnapshotReader snapshotReader = table.newSnapshotReader(); + TableRead read = table.newRead(); + StreamTableWrite write = table.newWrite(""); + StreamTableCommit commit = table.newCommit(""); + // 1. Inserts + write.write(GenericRow.of(1, 1, 10, 1, 20, 20, 1)); + write.write(GenericRow.of(1, 1, 11, 2, 25, 25, 0)); + write.write(GenericRow.of(1, 1, 12, 1, 29, 29, 2)); + commit.commit(0, write.prepareCommit(true, 0)); + List result = + getResult(read, toSplits(snapshotReader.read().dataSplits()), rowToString); + assertThat(result).containsExactlyInAnyOrder("+I[1, 1, 11, 2, 29, 29, 2]"); + + // 2. Update Before + write.write(GenericRow.ofKind(RowKind.UPDATE_BEFORE, 1, 1, 11, 2, 29, 29, 2)); + commit.commit(1, write.prepareCommit(true, 1)); + result = getResult(read, toSplits(snapshotReader.read().dataSplits()), rowToString); + assertThat(result).containsExactlyInAnyOrder("+I[1, 1, NULL, 2, NULL, NULL, 2]"); + + // 3. Update After + write.write(GenericRow.ofKind(RowKind.UPDATE_AFTER, 1, 1, 11, 2, 30, 30, 3)); + commit.commit(2, write.prepareCommit(true, 2)); + result = getResult(read, toSplits(snapshotReader.read().dataSplits()), rowToString); + assertThat(result).containsExactlyInAnyOrder("+I[1, 1, 11, 2, 30, 30, 3]"); + + // 4. 
Retracts + write.write(GenericRow.ofKind(RowKind.DELETE, 1, 1, 12, 3, 30, 30, 2)); + commit.commit(3, write.prepareCommit(true, 3)); + result = getResult(read, toSplits(snapshotReader.read().dataSplits()), rowToString); + assertThat(result).containsExactlyInAnyOrder("+I[1, 1, NULL, 3, 30, 30, 3]"); + + write.write(GenericRow.ofKind(RowKind.DELETE, 1, 1, 12, 2, 30, 31, 5)); + commit.commit(4, write.prepareCommit(true, 4)); + result = getResult(read, toSplits(snapshotReader.read().dataSplits()), rowToString); + assertThat(result).isEmpty(); + + // 5. Inserts + write.write(GenericRow.of(1, 1, 11, 2, 30, 31, 6)); + commit.commit(5, write.prepareCommit(true, 5)); + result = getResult(read, toSplits(snapshotReader.read().dataSplits()), rowToString); + assertThat(result).containsExactlyInAnyOrder("+I[1, 1, 11, 2, 30, 31, 6]"); + + write.close(); + commit.close(); + } + @Test public void testPartialUpdateWithAgg() throws Exception { RowType rowType = From 7e1fe395df0831a9d65bf4b6126562252a7a7bf2 Mon Sep 17 00:00:00 2001 From: tsreaper Date: Thu, 14 Nov 2024 18:36:02 +0800 Subject: [PATCH 018/157] [flink] Support updating row type nested in array/map in Flink (#4528) --- .../paimon/casting/CastElementGetter.java | 41 ++++ .../paimon/casting/CastFieldGetter.java | 3 + .../apache/paimon/casting/CastedArray.java | 201 ++++++++++++++++++ .../org/apache/paimon/casting/CastedMap.java | 70 ++++++ .../org/apache/paimon/casting/CastedRow.java | 2 - .../paimon/schema/SchemaEvolutionUtil.java | 99 +++++---- .../apache/paimon/schema/SchemaManager.java | 44 +++- .../paimon/schema/SchemaManagerTest.java | 50 ++++- .../org/apache/paimon/flink/FlinkCatalog.java | 41 +++- .../paimon/flink/SchemaChangeITCase.java | 66 +++++- 10 files changed, 562 insertions(+), 55 deletions(-) create mode 100644 paimon-common/src/main/java/org/apache/paimon/casting/CastElementGetter.java create mode 100644 paimon-common/src/main/java/org/apache/paimon/casting/CastedArray.java create mode 100644 paimon-common/src/main/java/org/apache/paimon/casting/CastedMap.java diff --git a/paimon-common/src/main/java/org/apache/paimon/casting/CastElementGetter.java b/paimon-common/src/main/java/org/apache/paimon/casting/CastElementGetter.java new file mode 100644 index 0000000000000..b8a91f572a355 --- /dev/null +++ b/paimon-common/src/main/java/org/apache/paimon/casting/CastElementGetter.java @@ -0,0 +1,41 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.casting; + +import org.apache.paimon.data.InternalArray; + +/** Get element from array and cast it according to specific {@link CastExecutor}. 
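 *
 * Used by SchemaEvolutionUtil when building casted views for evolved array and map columns: it
 * pairs an element getter for the source element type with a CastExecutor targeting the evolved
 * type, so CastedArray (and the value side of CastedMap) can cast entries one by one.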
*/ +public class CastElementGetter { + + private final InternalArray.ElementGetter elementGetter; + private final CastExecutor castExecutor; + + @SuppressWarnings("unchecked") + public CastElementGetter( + InternalArray.ElementGetter elementGetter, CastExecutor castExecutor) { + this.elementGetter = elementGetter; + this.castExecutor = (CastExecutor) castExecutor; + } + + @SuppressWarnings("unchecked") + public V getElementOrNull(InternalArray array, int pos) { + Object value = elementGetter.getElementOrNull(array, pos); + return value == null ? null : (V) castExecutor.cast(value); + } +} diff --git a/paimon-common/src/main/java/org/apache/paimon/casting/CastFieldGetter.java b/paimon-common/src/main/java/org/apache/paimon/casting/CastFieldGetter.java index 02168300a8420..208ef5f30f5bd 100644 --- a/paimon-common/src/main/java/org/apache/paimon/casting/CastFieldGetter.java +++ b/paimon-common/src/main/java/org/apache/paimon/casting/CastFieldGetter.java @@ -24,14 +24,17 @@ * Get field value from row with given pos and cast it according to specific {@link CastExecutor}. */ public class CastFieldGetter { + private final InternalRow.FieldGetter fieldGetter; private final CastExecutor castExecutor; + @SuppressWarnings("unchecked") public CastFieldGetter(InternalRow.FieldGetter fieldGetter, CastExecutor castExecutor) { this.fieldGetter = fieldGetter; this.castExecutor = (CastExecutor) castExecutor; } + @SuppressWarnings("unchecked") public V getFieldOrNull(InternalRow row) { Object value = fieldGetter.getFieldOrNull(row); return value == null ? null : (V) castExecutor.cast(value); diff --git a/paimon-common/src/main/java/org/apache/paimon/casting/CastedArray.java b/paimon-common/src/main/java/org/apache/paimon/casting/CastedArray.java new file mode 100644 index 0000000000000..778b11d1f8873 --- /dev/null +++ b/paimon-common/src/main/java/org/apache/paimon/casting/CastedArray.java @@ -0,0 +1,201 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.casting; + +import org.apache.paimon.data.BinaryString; +import org.apache.paimon.data.Decimal; +import org.apache.paimon.data.InternalArray; +import org.apache.paimon.data.InternalMap; +import org.apache.paimon.data.InternalRow; +import org.apache.paimon.data.Timestamp; + +/** + * An implementation of {@link InternalArray} which provides a casted view of the underlying {@link + * InternalArray}. + * + *

It reads data from underlying {@link InternalArray} according to source logical type and casts + * it with specific {@link CastExecutor}. + */ +public class CastedArray implements InternalArray { + + private final CastElementGetter castElementGetter; + private InternalArray array; + + protected CastedArray(CastElementGetter castElementGetter) { + this.castElementGetter = castElementGetter; + } + + /** + * Replaces the underlying {@link InternalArray} backing this {@link CastedArray}. + * + *

This method replaces the array in place and does not return a new object. This is done for + * performance reasons. + */ + public static CastedArray from(CastElementGetter castElementGetter) { + return new CastedArray(castElementGetter); + } + + public CastedArray replaceArray(InternalArray array) { + this.array = array; + return this; + } + + @Override + public int size() { + return array.size(); + } + + @Override + public boolean[] toBooleanArray() { + boolean[] result = new boolean[size()]; + for (int i = 0; i < result.length; i++) { + result[i] = castElementGetter.getElementOrNull(array, i); + } + return result; + } + + @Override + public byte[] toByteArray() { + byte[] result = new byte[size()]; + for (int i = 0; i < result.length; i++) { + result[i] = castElementGetter.getElementOrNull(array, i); + } + return result; + } + + @Override + public short[] toShortArray() { + short[] result = new short[size()]; + for (int i = 0; i < result.length; i++) { + result[i] = castElementGetter.getElementOrNull(array, i); + } + return result; + } + + @Override + public int[] toIntArray() { + int[] result = new int[size()]; + for (int i = 0; i < result.length; i++) { + result[i] = castElementGetter.getElementOrNull(array, i); + } + return result; + } + + @Override + public long[] toLongArray() { + long[] result = new long[size()]; + for (int i = 0; i < result.length; i++) { + result[i] = castElementGetter.getElementOrNull(array, i); + } + return result; + } + + @Override + public float[] toFloatArray() { + float[] result = new float[size()]; + for (int i = 0; i < result.length; i++) { + result[i] = castElementGetter.getElementOrNull(array, i); + } + return result; + } + + @Override + public double[] toDoubleArray() { + double[] result = new double[size()]; + for (int i = 0; i < result.length; i++) { + result[i] = castElementGetter.getElementOrNull(array, i); + } + return result; + } + + @Override + public boolean isNullAt(int pos) { + return castElementGetter.getElementOrNull(array, pos) == null; + } + + @Override + public boolean getBoolean(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public byte getByte(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public short getShort(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public int getInt(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public long getLong(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public float getFloat(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public double getDouble(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public BinaryString getString(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public Decimal getDecimal(int pos, int precision, int scale) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public Timestamp getTimestamp(int pos, int precision) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public byte[] getBinary(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public InternalArray getArray(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public InternalMap getMap(int pos) { + return castElementGetter.getElementOrNull(array, pos); + } + + @Override + public 
InternalRow getRow(int pos, int numFields) { + return castElementGetter.getElementOrNull(array, pos); + } +} diff --git a/paimon-common/src/main/java/org/apache/paimon/casting/CastedMap.java b/paimon-common/src/main/java/org/apache/paimon/casting/CastedMap.java new file mode 100644 index 0000000000000..4068407ca71c4 --- /dev/null +++ b/paimon-common/src/main/java/org/apache/paimon/casting/CastedMap.java @@ -0,0 +1,70 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.casting; + +import org.apache.paimon.data.InternalArray; +import org.apache.paimon.data.InternalMap; + +/** + * An implementation of {@link InternalMap} which provides a casted view of the underlying {@link + * InternalMap}. + * + *
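 * Only the value array is wrapped for casting; keyArray() is returned unchanged, which matches
 * the constraint in SchemaEvolutionUtil that map key types must stay identical across schema
 * evolution.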

It reads data from underlying {@link InternalMap} according to source logical type and casts + * it with specific {@link CastExecutor}. + */ +public class CastedMap implements InternalMap { + + private final CastedArray castedValueArray; + private InternalMap map; + + protected CastedMap(CastElementGetter castValueGetter) { + this.castedValueArray = CastedArray.from(castValueGetter); + } + + /** + * Replaces the underlying {@link InternalMap} backing this {@link CastedMap}. + * + *

This method replaces the map in place and does not return a new object. This is done for + * performance reasons. + */ + public static CastedMap from(CastElementGetter castValueGetter) { + return new CastedMap(castValueGetter); + } + + public CastedMap replaceMap(InternalMap map) { + this.castedValueArray.replaceArray(map.valueArray()); + this.map = map; + return this; + } + + @Override + public int size() { + return map.size(); + } + + @Override + public InternalArray keyArray() { + return map.keyArray(); + } + + @Override + public InternalArray valueArray() { + return castedValueArray; + } +} diff --git a/paimon-common/src/main/java/org/apache/paimon/casting/CastedRow.java b/paimon-common/src/main/java/org/apache/paimon/casting/CastedRow.java index 25c5744255ef4..f9216d10b3a85 100644 --- a/paimon-common/src/main/java/org/apache/paimon/casting/CastedRow.java +++ b/paimon-common/src/main/java/org/apache/paimon/casting/CastedRow.java @@ -34,8 +34,6 @@ * *

It reads data from underlying {@link InternalRow} according to source logical type and casts * it with specific {@link CastExecutor}. - * - *

Note: This class supports only top-level castings, not nested castings. */ public class CastedRow implements InternalRow { diff --git a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaEvolutionUtil.java b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaEvolutionUtil.java index b5d7307073595..0ae2798c29e00 100644 --- a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaEvolutionUtil.java +++ b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaEvolutionUtil.java @@ -19,10 +19,15 @@ package org.apache.paimon.schema; import org.apache.paimon.KeyValue; +import org.apache.paimon.casting.CastElementGetter; import org.apache.paimon.casting.CastExecutor; import org.apache.paimon.casting.CastExecutors; import org.apache.paimon.casting.CastFieldGetter; +import org.apache.paimon.casting.CastedArray; +import org.apache.paimon.casting.CastedMap; import org.apache.paimon.casting.CastedRow; +import org.apache.paimon.data.InternalArray; +import org.apache.paimon.data.InternalMap; import org.apache.paimon.data.InternalRow; import org.apache.paimon.predicate.LeafPredicate; import org.apache.paimon.predicate.Predicate; @@ -31,7 +36,6 @@ import org.apache.paimon.types.DataField; import org.apache.paimon.types.DataType; import org.apache.paimon.types.MapType; -import org.apache.paimon.types.MultisetType; import org.apache.paimon.types.RowType; import org.apache.paimon.utils.InternalRowUtils; import org.apache.paimon.utils.ProjectedRow; @@ -372,6 +376,7 @@ private static CastFieldGetter[] createCastFieldGetterMapping( List tableFields, List dataFields, int[] indexMapping) { CastFieldGetter[] converterMapping = new CastFieldGetter[tableFields.size()]; boolean castExist = false; + for (int i = 0; i < tableFields.size(); i++) { int dataIndex = indexMapping == null ? 
i : indexMapping[i]; if (dataIndex < 0) { @@ -380,53 +385,39 @@ private static CastFieldGetter[] createCastFieldGetterMapping( } else { DataField tableField = tableFields.get(i); DataField dataField = dataFields.get(dataIndex); - if (dataField.type().equalsIgnoreNullable(tableField.type())) { - // Create getter with index i and projected row data will convert to underlying - // data - converterMapping[i] = - new CastFieldGetter( - InternalRowUtils.createNullCheckingFieldGetter( - dataField.type(), i), - CastExecutors.identityCastExecutor()); - } else { - // TODO support column type evolution in nested type - checkState( - !(tableField.type() instanceof MapType - || dataField.type() instanceof ArrayType - || dataField.type() instanceof MultisetType), - "Only support column type evolution in atomic and row data type."); - - CastExecutor castExecutor; - if (tableField.type() instanceof RowType - && dataField.type() instanceof RowType) { - castExecutor = - createRowCastExecutor( - (RowType) dataField.type(), (RowType) tableField.type()); - } else { - castExecutor = CastExecutors.resolve(dataField.type(), tableField.type()); - } - checkNotNull( - castExecutor, - "Cannot cast from type " - + dataField.type() - + " to type " - + tableField.type()); - - // Create getter with index i and projected row data will convert to underlying - // data - converterMapping[i] = - new CastFieldGetter( - InternalRowUtils.createNullCheckingFieldGetter( - dataField.type(), i), - castExecutor); + if (!dataField.type().equalsIgnoreNullable(tableField.type())) { castExist = true; } + + // Create getter with index i and projected row data will convert to underlying data + converterMapping[i] = + new CastFieldGetter( + InternalRowUtils.createNullCheckingFieldGetter(dataField.type(), i), + createCastExecutor(dataField.type(), tableField.type())); } } return castExist ? 
converterMapping : null; } + private static CastExecutor createCastExecutor(DataType inputType, DataType targetType) { + if (targetType.equalsIgnoreNullable(inputType)) { + return CastExecutors.identityCastExecutor(); + } else if (inputType instanceof RowType && targetType instanceof RowType) { + return createRowCastExecutor((RowType) inputType, (RowType) targetType); + } else if (inputType instanceof ArrayType && targetType instanceof ArrayType) { + return createArrayCastExecutor((ArrayType) inputType, (ArrayType) targetType); + } else if (inputType instanceof MapType && targetType instanceof MapType) { + return createMapCastExecutor((MapType) inputType, (MapType) targetType); + } else { + return checkNotNull( + CastExecutors.resolve(inputType, targetType), + "Cannot cast from type %s to type %s", + inputType, + targetType); + } + } + private static CastExecutor createRowCastExecutor( RowType inputType, RowType targetType) { int[] indexMapping = createIndexMapping(targetType.getFields(), inputType.getFields()); @@ -446,4 +437,32 @@ private static CastExecutor createRowCastExecutor( return value; }; } + + private static CastExecutor createArrayCastExecutor( + ArrayType inputType, ArrayType targetType) { + CastElementGetter castElementGetter = + new CastElementGetter( + InternalArray.createElementGetter(inputType.getElementType()), + createCastExecutor( + inputType.getElementType(), targetType.getElementType())); + + CastedArray castedArray = CastedArray.from(castElementGetter); + return castedArray::replaceArray; + } + + private static CastExecutor createMapCastExecutor( + MapType inputType, MapType targetType) { + checkState( + inputType.getKeyType().equals(targetType.getKeyType()), + "Cannot cast map type %s to map type %s, because they have different key types.", + inputType.getKeyType(), + targetType.getKeyType()); + CastElementGetter castElementGetter = + new CastElementGetter( + InternalArray.createElementGetter(inputType.getValueType()), + createCastExecutor(inputType.getValueType(), targetType.getValueType())); + + CastedMap castedMap = CastedMap.from(castElementGetter); + return castedMap::replaceMap; + } } diff --git a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java index 86e365a88f831..a84348810b990 100644 --- a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java +++ b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java @@ -37,9 +37,11 @@ import org.apache.paimon.schema.SchemaChange.UpdateColumnType; import org.apache.paimon.schema.SchemaChange.UpdateComment; import org.apache.paimon.table.FileStoreTableFactory; +import org.apache.paimon.types.ArrayType; import org.apache.paimon.types.DataField; import org.apache.paimon.types.DataType; import org.apache.paimon.types.DataTypeCasts; +import org.apache.paimon.types.MapType; import org.apache.paimon.types.ReassignFieldId; import org.apache.paimon.types.RowType; import org.apache.paimon.utils.BranchManager; @@ -636,17 +638,17 @@ public void updateIntermediateColumn(List newFields, int depth) continue; } + String fullFieldName = + String.join(".", Arrays.asList(updateFieldNames).subList(0, depth + 1)); List nestedFields = - new ArrayList<>( - ((org.apache.paimon.types.RowType) field.type()).getFields()); + new ArrayList<>(extractRowType(field.type(), fullFieldName).getFields()); updateIntermediateColumn(nestedFields, depth + 1); newFields.set( i, new DataField( field.id(), field.name(), - new 
org.apache.paimon.types.RowType( - field.type().isNullable(), nestedFields), + wrapNewRowType(field.type(), nestedFields), field.description())); return; } @@ -656,6 +658,40 @@ public void updateIntermediateColumn(List newFields, int depth) String.join(".", Arrays.asList(updateFieldNames).subList(0, depth + 1))); } + private RowType extractRowType(DataType type, String fullFieldName) { + switch (type.getTypeRoot()) { + case ROW: + return (RowType) type; + case ARRAY: + return extractRowType(((ArrayType) type).getElementType(), fullFieldName); + case MAP: + return extractRowType(((MapType) type).getValueType(), fullFieldName); + default: + throw new IllegalArgumentException( + fullFieldName + " is not a structured type."); + } + } + + private DataType wrapNewRowType(DataType type, List nestedFields) { + switch (type.getTypeRoot()) { + case ROW: + return new RowType(type.isNullable(), nestedFields); + case ARRAY: + return new ArrayType( + type.isNullable(), + wrapNewRowType(((ArrayType) type).getElementType(), nestedFields)); + case MAP: + MapType mapType = (MapType) type; + return new MapType( + type.isNullable(), + mapType.getKeyType(), + wrapNewRowType(mapType.getValueType(), nestedFields)); + default: + throw new IllegalStateException( + "Trying to wrap a row type in " + type + ". This is unexpected."); + } + } + protected abstract void updateLastColumn(List newFields, String fieldName) throws Catalog.ColumnNotExistException, Catalog.ColumnAlreadyExistException; diff --git a/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java b/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java index 088cb72f92e6c..f0d6543699659 100644 --- a/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java @@ -31,6 +31,7 @@ import org.apache.paimon.table.FileStoreTableFactory; import org.apache.paimon.table.sink.TableCommitImpl; import org.apache.paimon.table.sink.TableWriteImpl; +import org.apache.paimon.types.ArrayType; import org.apache.paimon.types.BigIntType; import org.apache.paimon.types.DataField; import org.apache.paimon.types.DataTypes; @@ -690,7 +691,7 @@ public void testUpdateNestedColumnType() throws Exception { SchemaChange updateColumnType = SchemaChange.updateColumnType( - new String[] {"v", "f2", "f1"}, DataTypes.BIGINT(), true); + new String[] {"v", "f2", "f1"}, DataTypes.BIGINT(), false); manager.commitChanges(updateColumnType); innerType = @@ -708,8 +709,53 @@ public void testUpdateNestedColumnType() throws Exception { SchemaChange middleColumnNotExistUpdateColumnType = SchemaChange.updateColumnType( - new String[] {"v", "invalid", "f1"}, DataTypes.BIGINT(), true); + new String[] {"v", "invalid", "f1"}, DataTypes.BIGINT(), false); assertThatCode(() -> manager.commitChanges(middleColumnNotExistUpdateColumnType)) .hasMessageContaining("Column v.invalid does not exist"); } + + @Test + public void testUpdateRowTypeInArrayAndMap() throws Exception { + RowType innerType = + RowType.of( + new DataField(2, "f1", DataTypes.INT()), + new DataField(3, "f2", DataTypes.BIGINT())); + RowType outerType = + RowType.of( + new DataField(0, "k", DataTypes.INT()), + new DataField( + 1, "v", new ArrayType(new MapType(DataTypes.INT(), innerType)))); + + Schema schema = + new Schema( + outerType.getFields(), + Collections.singletonList("k"), + Collections.emptyList(), + new HashMap<>(), + ""); + SchemaManager manager = new SchemaManager(LocalFileIO.create(), path); + 
manager.createTable(schema); + + SchemaChange addColumn = + SchemaChange.addColumn( + new String[] {"v", "f3"}, + DataTypes.STRING(), + null, + SchemaChange.Move.first("f3")); + SchemaChange dropColumn = SchemaChange.dropColumn(new String[] {"v", "f2"}); + SchemaChange updateColumnType = + SchemaChange.updateColumnType(new String[] {"v", "f1"}, DataTypes.BIGINT(), false); + manager.commitChanges(addColumn, dropColumn, updateColumnType); + + innerType = + RowType.of( + new DataField(4, "f3", DataTypes.STRING()), + new DataField(2, "f1", DataTypes.BIGINT())); + outerType = + RowType.of( + new DataField(0, "k", DataTypes.INT()), + new DataField( + 1, "v", new ArrayType(new MapType(DataTypes.INT(), innerType)))); + assertThat(manager.latest().get().logicalRowType()).isEqualTo(outerType); + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java index ae30fa569d59e..09fc0328ef655 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java @@ -673,14 +673,13 @@ private void generateNestedColumnUpdates( org.apache.paimon.types.DataType oldType, org.apache.paimon.types.DataType newType, List schemaChanges) { + String joinedNames = String.join(".", fieldNames); if (oldType.getTypeRoot() == DataTypeRoot.ROW) { Preconditions.checkArgument( newType.getTypeRoot() == DataTypeRoot.ROW, - "Column " - + String.join(".", fieldNames) - + " can only be updated to row type, and cannot be updated to " - + newType - + " type"); + "Column %s can only be updated to row type, and cannot be updated to %s type", + joinedNames, + newType.getTypeRoot()); org.apache.paimon.types.RowType oldRowType = (org.apache.paimon.types.RowType) oldType; org.apache.paimon.types.RowType newRowType = (org.apache.paimon.types.RowType) newType; @@ -699,7 +698,7 @@ private void generateNestedColumnUpdates( lastIdx < idx, "Order of existing fields in column %s must be kept the same. 
" + "However, field %s and %s have changed their orders.", - String.join(".", fieldNames), + joinedNames, lastFieldName, name); lastIdx = idx; @@ -751,6 +750,36 @@ private void generateNestedColumnUpdates( fullFieldNames, oldField.type(), field.type(), schemaChanges); } } + } else if (oldType.getTypeRoot() == DataTypeRoot.ARRAY) { + Preconditions.checkArgument( + newType.getTypeRoot() == DataTypeRoot.ARRAY, + "Column %s can only be updated to array type, and cannot be updated to %s type", + joinedNames, + newType); + generateNestedColumnUpdates( + fieldNames, + ((org.apache.paimon.types.ArrayType) oldType).getElementType(), + ((org.apache.paimon.types.ArrayType) newType).getElementType(), + schemaChanges); + } else if (oldType.getTypeRoot() == DataTypeRoot.MAP) { + Preconditions.checkArgument( + newType.getTypeRoot() == DataTypeRoot.MAP, + "Column %s can only be updated to map type, and cannot be updated to %s type", + joinedNames, + newType); + org.apache.paimon.types.MapType oldMapType = (org.apache.paimon.types.MapType) oldType; + org.apache.paimon.types.MapType newMapType = (org.apache.paimon.types.MapType) newType; + Preconditions.checkArgument( + oldMapType.getKeyType().equals(newMapType.getKeyType()), + "Cannot update key type of column %s from %s type to %s type", + joinedNames, + oldMapType.getKeyType(), + newMapType.getKeyType()); + generateNestedColumnUpdates( + fieldNames, + oldMapType.getValueType(), + newMapType.getValueType(), + schemaChanges); } else { if (!oldType.equalsIgnoreNullable(newType)) { schemaChanges.add( diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java index a2ef1d5c8acec..a8e8332156b37 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SchemaChangeITCase.java @@ -29,6 +29,7 @@ import org.junit.jupiter.params.provider.ValueSource; import java.time.format.DateTimeFormatter; +import java.util.HashMap; import java.util.List; import java.util.Map; import java.util.Objects; @@ -1133,6 +1134,69 @@ public void testUpdateNestedColumn(String formatType) { assertThatCode(() -> sql("ALTER TABLE T MODIFY (v ROW(f1 BIGINT, f2 INT, f3 STRING))")) .hasRootCauseMessage( - "Column v.f2 can only be updated to row type, and cannot be updated to INT type"); + "Column v.f2 can only be updated to row type, and cannot be updated to INTEGER type"); + } + + @ParameterizedTest() + @ValueSource(strings = {"orc", "avro", "parquet"}) + public void testUpdateRowInArrayAndMap(String formatType) { + sql( + "CREATE TABLE T " + + "( k INT, v1 ARRAY, v2 MAP, PRIMARY KEY (k) NOT ENFORCED ) " + + "WITH ( 'bucket' = '1', 'file.format' = '" + + formatType + + "' )"); + sql( + "INSERT INTO T VALUES " + + "(1, ARRAY[ROW(100, 'apple'), ROW(101, 'banana')], MAP[100, ROW('cat', 1000), 101, ROW('dog', 1001)]), " + + "(2, ARRAY[ROW(200, 'pear'), ROW(201, 'grape')], MAP[200, ROW('tiger', 2000), 201, ROW('wolf', 2001)])"); + + Map map1 = new HashMap<>(); + map1.put(100, Row.of("cat", 1000)); + map1.put(101, Row.of("dog", 1001)); + Map map2 = new HashMap<>(); + map2.put(200, Row.of("tiger", 2000)); + map2.put(201, Row.of("wolf", 2001)); + assertThat(sql("SELECT * FROM T")) + .containsExactlyInAnyOrder( + Row.of(1, new Row[] {Row.of(100, "apple"), Row.of(101, "banana")}, map1), + Row.of(2, new Row[] {Row.of(200, "pear"), 
Row.of(201, "grape")}, map2)); + + sql( + "ALTER TABLE T MODIFY (v1 ARRAY, v2 MAP)"); + sql( + "INSERT INTO T VALUES " + + "(1, ARRAY[ROW(1000000000000, 'apple', 'A'), ROW(1000000000001, 'banana', 'B')], MAP[100, ROW(1000.0, 1000), 101, ROW(1001.0, 1001)]), " + + "(3, ARRAY[ROW(3000000000000, 'mango', 'M'), ROW(3000000000001, 'cherry', 'C')], MAP[300, ROW(3000.0, 3000), 301, ROW(3001.0, 3001)])"); + + map1.clear(); + map1.put(100, Row.of(1000.0, 1000)); + map1.put(101, Row.of(1001.0, 1001)); + map2.clear(); + map2.put(200, Row.of(null, 2000)); + map2.put(201, Row.of(null, 2001)); + Map map3 = new HashMap<>(); + map3.put(300, Row.of(3000.0, 3000)); + map3.put(301, Row.of(3001.0, 3001)); + assertThat(sql("SELECT v2, v1, k FROM T")) + .containsExactlyInAnyOrder( + Row.of( + map1, + new Row[] { + Row.of(1000000000000L, "apple", "A"), + Row.of(1000000000001L, "banana", "B") + }, + 1), + Row.of( + map2, + new Row[] {Row.of(200L, "pear", null), Row.of(201L, "grape", null)}, + 2), + Row.of( + map3, + new Row[] { + Row.of(3000000000000L, "mango", "M"), + Row.of(3000000000001L, "cherry", "C") + }, + 3)); } } From 9e4b28ae27a786fa9833571556560ce0b9c07f01 Mon Sep 17 00:00:00 2001 From: WenjunMin Date: Thu, 14 Nov 2024 18:39:54 +0800 Subject: [PATCH 019/157] [core] Introduce binlog system table to pack the UB and UA (#4520) --- docs/content/maintenance/system-tables.md | 19 +++ .../paimon/reader/PackChangelogReader.java | 131 +++++++++++++++ .../paimon/table/system/AuditLogTable.java | 12 +- .../paimon/table/system/BinlogTable.java | 151 ++++++++++++++++++ .../table/system/SystemTableLoader.java | 2 + paimon-flink/paimon-flink-common/pom.xml | 6 + .../paimon/flink/SystemTableITCase.java | 66 ++++++++ 7 files changed, 381 insertions(+), 6 deletions(-) create mode 100644 paimon-common/src/main/java/org/apache/paimon/reader/PackChangelogReader.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/table/system/BinlogTable.java create mode 100644 paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SystemTableITCase.java diff --git a/docs/content/maintenance/system-tables.md b/docs/content/maintenance/system-tables.md index 462f8c27f887d..0246d6faf8dc5 100644 --- a/docs/content/maintenance/system-tables.md +++ b/docs/content/maintenance/system-tables.md @@ -406,4 +406,23 @@ SELECT * FROM T$statistics; 1 rows in set */ ``` +### Binlog Table + +You can streaming or batch query the binlog through binlog table. In this system table, +the update before and update after will be packed in one row. + +``` +/* ++------------------+----------------------+-----------------------+ +| rowkind | column_0 | column_1 | ++------------------+----------------------+-----------------------+ +| +I | [col_0] | [col_1] | ++------------------+----------------------+-----------------------+ +| +U | [col_0_ub, col_0_ua] | [col_1_ub, col_1_ua] | ++------------------+----------------------+-----------------------+ +| -D | [col_0] | [col_1] | ++------------------+----------------------+-----------------------+ +*/ +``` + diff --git a/paimon-common/src/main/java/org/apache/paimon/reader/PackChangelogReader.java b/paimon-common/src/main/java/org/apache/paimon/reader/PackChangelogReader.java new file mode 100644 index 0000000000000..a60780ff5e065 --- /dev/null +++ b/paimon-common/src/main/java/org/apache/paimon/reader/PackChangelogReader.java @@ -0,0 +1,131 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. 
See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.reader; + +import org.apache.paimon.data.InternalRow; +import org.apache.paimon.data.serializer.InternalRowSerializer; +import org.apache.paimon.types.RowKind; +import org.apache.paimon.types.RowType; + +import javax.annotation.Nullable; + +import java.io.IOException; +import java.util.function.BiFunction; + +/** The reader which will pack the update before and update after message together. */ +public class PackChangelogReader implements RecordReader { + + private final RecordReader reader; + private final BiFunction function; + private final InternalRowSerializer serializer; + private boolean initialized = false; + + public PackChangelogReader( + RecordReader reader, + BiFunction function, + RowType rowType) { + this.reader = reader; + this.function = function; + this.serializer = new InternalRowSerializer(rowType); + } + + @Nullable + @Override + public RecordIterator readBatch() throws IOException { + if (!initialized) { + initialized = true; + return new InternRecordIterator(reader, function, serializer); + } + return null; + } + + @Override + public void close() throws IOException { + reader.close(); + } + + private static class InternRecordIterator implements RecordIterator { + + private RecordIterator currentBatch; + + private final BiFunction function; + private final RecordReader reader; + private final InternalRowSerializer serializer; + private boolean endOfData; + + public InternRecordIterator( + RecordReader reader, + BiFunction function, + InternalRowSerializer serializer) { + this.reader = reader; + this.function = function; + this.serializer = serializer; + this.endOfData = false; + } + + @Nullable + @Override + public InternalRow next() throws IOException { + InternalRow row1 = nextRow(); + if (row1 == null) { + return null; + } + InternalRow row2 = null; + if (row1.getRowKind() == RowKind.UPDATE_BEFORE) { + row1 = serializer.copy(row1); + row2 = nextRow(); + } + return function.apply(row1, row2); + } + + @Nullable + private InternalRow nextRow() throws IOException { + InternalRow row = null; + while (!endOfData && row == null) { + RecordIterator batch = nextBatch(); + if (batch == null) { + endOfData = true; + return null; + } + + row = batch.next(); + if (row == null) { + releaseBatch(); + } + } + return row; + } + + @Nullable + private RecordIterator nextBatch() throws IOException { + if (currentBatch == null) { + currentBatch = reader.readBatch(); + } + return currentBatch; + } + + @Override + public void releaseBatch() { + if (currentBatch != null) { + currentBatch.releaseBatch(); + currentBatch = null; + } + } + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/AuditLogTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/AuditLogTable.java index e0acd9fb38ea6..7438f9393d604 100644 --- 
a/paimon-core/src/main/java/org/apache/paimon/table/system/AuditLogTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/AuditLogTable.java @@ -526,13 +526,13 @@ public DataTableScan withShard(int indexOfThisSubtask, int numberOfParallelSubta } } - private class AuditLogRead implements InnerTableRead { + class AuditLogRead implements InnerTableRead { - private final InnerTableRead dataRead; + protected final InnerTableRead dataRead; - private int[] readProjection; + protected int[] readProjection; - private AuditLogRead(InnerTableRead dataRead) { + protected AuditLogRead(InnerTableRead dataRead) { this.dataRead = dataRead.forceKeepDelete(); this.readProjection = defaultProjection(); } @@ -600,9 +600,9 @@ private InternalRow convertRow(InternalRow data) { } /** A {@link ProjectedRow} which returns row kind when mapping index is negative. */ - private static class AuditLogRow extends ProjectedRow { + static class AuditLogRow extends ProjectedRow { - private AuditLogRow(int[] indexMapping, InternalRow row) { + AuditLogRow(int[] indexMapping, InternalRow row) { super(indexMapping); replaceRow(row); } diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/BinlogTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/BinlogTable.java new file mode 100644 index 0000000000000..96f9f6ed6185f --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/BinlogTable.java @@ -0,0 +1,151 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.table.system; + +import org.apache.paimon.data.GenericArray; +import org.apache.paimon.data.GenericRow; +import org.apache.paimon.data.InternalRow; +import org.apache.paimon.reader.PackChangelogReader; +import org.apache.paimon.reader.RecordReader; +import org.apache.paimon.table.FileStoreTable; +import org.apache.paimon.table.SpecialFields; +import org.apache.paimon.table.Table; +import org.apache.paimon.table.source.DataSplit; +import org.apache.paimon.table.source.InnerTableRead; +import org.apache.paimon.table.source.Split; +import org.apache.paimon.types.ArrayType; +import org.apache.paimon.types.DataField; +import org.apache.paimon.types.RowType; + +import javax.annotation.Nullable; + +import java.io.IOException; +import java.util.ArrayList; +import java.util.List; +import java.util.Map; + +import static org.apache.paimon.catalog.Catalog.SYSTEM_TABLE_SPLITTER; + +/** + * A {@link Table} for reading binlog of table. The binlog format is as below. + * + *

INSERT: [+I, [co1, null], [col2, null]] + * + *

UPDATE: [+U, [co1_ub, col1_ua], [col2_ub, col2_ua]] + * + *

DELETE: [-D, [co1, null], [col2, null]] + */ +public class BinlogTable extends AuditLogTable { + + public static final String BINLOG = "binlog"; + + private final FileStoreTable wrapped; + + public BinlogTable(FileStoreTable wrapped) { + super(wrapped); + this.wrapped = wrapped; + } + + @Override + public String name() { + return wrapped.name() + SYSTEM_TABLE_SPLITTER + BINLOG; + } + + @Override + public RowType rowType() { + List fields = new ArrayList<>(); + fields.add(SpecialFields.ROW_KIND); + for (DataField field : wrapped.rowType().getFields()) { + DataField newField = + new DataField( + field.id(), + field.name(), + new ArrayType(field.type().nullable()), // convert to nullable + field.description()); + fields.add(newField); + } + return new RowType(fields); + } + + @Override + public InnerTableRead newRead() { + return new BinlogRead(wrapped.newRead()); + } + + @Override + public Table copy(Map dynamicOptions) { + return new BinlogTable(wrapped.copy(dynamicOptions)); + } + + private class BinlogRead extends AuditLogRead { + + private BinlogRead(InnerTableRead dataRead) { + super(dataRead); + } + + @Override + public RecordReader createReader(Split split) throws IOException { + DataSplit dataSplit = (DataSplit) split; + if (dataSplit.isStreaming()) { + return new PackChangelogReader( + dataRead.createReader(split), + (row1, row2) -> + new AuditLogRow( + readProjection, + convertToArray( + row1, row2, wrapped.rowType().fieldGetters())), + wrapped.rowType()); + } else { + return dataRead.createReader(split) + .transform( + (row) -> + new AuditLogRow( + readProjection, + convertToArray( + row, + null, + wrapped.rowType().fieldGetters()))); + } + } + + private InternalRow convertToArray( + InternalRow row1, + @Nullable InternalRow row2, + InternalRow.FieldGetter[] fieldGetters) { + GenericRow row = new GenericRow(row1.getFieldCount()); + for (int i = 0; i < row1.getFieldCount(); i++) { + Object o1 = fieldGetters[i].getFieldOrNull(row1); + Object o2; + if (row2 != null) { + o2 = fieldGetters[i].getFieldOrNull(row2); + row.setField(i, new GenericArray(new Object[] {o1, o2})); + } else { + row.setField(i, new GenericArray(new Object[] {o1})); + } + } + // If no row2 provided, then follow the row1 kind. 
+ if (row2 == null) { + row.setRowKind(row1.getRowKind()); + } else { + row.setRowKind(row2.getRowKind()); + } + return row; + } + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/SystemTableLoader.java b/paimon-core/src/main/java/org/apache/paimon/table/system/SystemTableLoader.java index a84f41ec1a514..3d5b211316ec1 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/SystemTableLoader.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/SystemTableLoader.java @@ -41,6 +41,7 @@ import static org.apache.paimon.table.system.AggregationFieldsTable.AGGREGATION_FIELDS; import static org.apache.paimon.table.system.AllTableOptionsTable.ALL_TABLE_OPTIONS; import static org.apache.paimon.table.system.AuditLogTable.AUDIT_LOG; +import static org.apache.paimon.table.system.BinlogTable.BINLOG; import static org.apache.paimon.table.system.BranchesTable.BRANCHES; import static org.apache.paimon.table.system.BucketsTable.BUCKETS; import static org.apache.paimon.table.system.CatalogOptionsTable.CATALOG_OPTIONS; @@ -77,6 +78,7 @@ public class SystemTableLoader { .put(READ_OPTIMIZED, ReadOptimizedTable::new) .put(AGGREGATION_FIELDS, AggregationFieldsTable::new) .put(STATISTICS, StatisticTable::new) + .put(BINLOG, BinlogTable::new) .build(); public static final List SYSTEM_TABLES = new ArrayList<>(SYSTEM_TABLE_LOADERS.keySet()); diff --git a/paimon-flink/paimon-flink-common/pom.xml b/paimon-flink/paimon-flink-common/pom.xml index 4452af266e5e6..91222983bf6ba 100644 --- a/paimon-flink/paimon-flink-common/pom.xml +++ b/paimon-flink/paimon-flink-common/pom.xml @@ -162,6 +162,12 @@ under the License. iceberg-data ${iceberg.version} test + + + parquet-avro + org.apache.parquet + + diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SystemTableITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SystemTableITCase.java new file mode 100644 index 0000000000000..771f4acc5e585 --- /dev/null +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/SystemTableITCase.java @@ -0,0 +1,66 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink; + +import org.apache.paimon.utils.BlockingIterator; + +import org.apache.flink.types.Row; +import org.junit.jupiter.api.Test; + +import java.util.List; + +import static org.assertj.core.api.Assertions.assertThat; + +/** ITCase for system table. 
*/ +public class SystemTableITCase extends CatalogTableITCase { + + @Test + public void testBinlogTableStreamRead() throws Exception { + sql( + "CREATE TABLE T (a INT, b INT, primary key (a) NOT ENFORCED) with ('changelog-producer' = 'lookup', " + + "'bucket' = '2')"); + BlockingIterator iterator = + streamSqlBlockIter("SELECT * FROM T$binlog /*+ OPTIONS('scan.mode' = 'latest') */"); + sql("INSERT INTO T VALUES (1, 2)"); + sql("INSERT INTO T VALUES (1, 3)"); + sql("INSERT INTO T VALUES (2, 2)"); + List rows = iterator.collect(3); + assertThat(rows) + .containsExactly( + Row.of("+I", new Integer[] {1}, new Integer[] {2}), + Row.of("+U", new Integer[] {1, 1}, new Integer[] {2, 3}), + Row.of("+I", new Integer[] {2}, new Integer[] {2})); + iterator.close(); + } + + @Test + public void testBinlogTableBatchRead() throws Exception { + sql( + "CREATE TABLE T (a INT, b INT, primary key (a) NOT ENFORCED) with ('changelog-producer' = 'lookup', " + + "'bucket' = '2')"); + sql("INSERT INTO T VALUES (1, 2)"); + sql("INSERT INTO T VALUES (1, 3)"); + sql("INSERT INTO T VALUES (2, 2)"); + List rows = sql("SELECT * FROM T$binlog /*+ OPTIONS('scan.mode' = 'latest') */"); + assertThat(rows) + .containsExactly( + Row.of("+I", new Integer[] {1}, new Integer[] {3}), + Row.of("+I", new Integer[] {2}, new Integer[] {2})); + } +} From 9b9ed72efaef15f7f3e2333b519bf476c122352b Mon Sep 17 00:00:00 2001 From: WenjunMin Date: Thu, 14 Nov 2024 19:05:20 +0800 Subject: [PATCH 020/157] [doc] Add the query binlog example in doc (#4532) --- docs/content/maintenance/system-tables.md | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/docs/content/maintenance/system-tables.md b/docs/content/maintenance/system-tables.md index 0246d6faf8dc5..5ef5121c25a92 100644 --- a/docs/content/maintenance/system-tables.md +++ b/docs/content/maintenance/system-tables.md @@ -408,10 +408,11 @@ SELECT * FROM T$statistics; ``` ### Binlog Table -You can streaming or batch query the binlog through binlog table. In this system table, -the update before and update after will be packed in one row. +You can query the binlog through binlog table. In the binlog system table, the update before and update after will be packed in one row. + +```sql +SELECT * FROM T$binlog; -``` /* +------------------+----------------------+-----------------------+ | rowkind | column_0 | column_1 | From 6f515203e3edf8c8ecc852054d111c8fc5e54cc4 Mon Sep 17 00:00:00 2001 From: Jingsong Date: Thu, 14 Nov 2024 19:19:13 +0800 Subject: [PATCH 021/157] [hotfix] Fix comments in BinlogTable --- .../main/java/org/apache/paimon/table/system/BinlogTable.java | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/BinlogTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/BinlogTable.java index 96f9f6ed6185f..b17d61d44e776 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/BinlogTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/BinlogTable.java @@ -45,11 +45,11 @@ /** * A {@link Table} for reading binlog of table. The binlog format is as below. * - *

INSERT: [+I, [co1, null], [col2, null]] + *

INSERT: [+I, [co1], [col2]] * *

UPDATE: [+U, [co1_ub, col1_ua], [col2_ub, col2_ua]] * - *

DELETE: [-D, [co1, null], [col2, null]] + *

DELETE: [-D, [co1], [col2]] */ public class BinlogTable extends AuditLogTable { From bf8f5598d9a48f907f2346df39507c27877a5952 Mon Sep 17 00:00:00 2001 From: yuzelin <33053040+yuzelin@users.noreply.github.com> Date: Thu, 14 Nov 2024 20:28:30 +0800 Subject: [PATCH 022/157] [parquet] Fix that cannot read parquet ROW data (#4533) --- .../columnar/heap/AbstractHeapVector.java | 4 +- .../data/columnar/heap/ElementCountable.java | 23 ++------ .../paimon/flink/BatchFileStoreITCase.java | 19 ++++++ .../format/parquet/ParquetReaderFactory.java | 6 +- .../parquet/reader/NestedColumnReader.java | 3 +- .../reader/NestedPrimitiveColumnReader.java | 6 +- .../parquet/reader/ParquetDecimalVector.java | 16 ++++- .../parquet/reader/RowColumnReader.java | 59 ------------------- 8 files changed, 50 insertions(+), 86 deletions(-) rename paimon-format/src/main/java/org/apache/paimon/format/parquet/position/RowPosition.java => paimon-common/src/main/java/org/apache/paimon/data/columnar/heap/ElementCountable.java (60%) delete mode 100644 paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/RowColumnReader.java diff --git a/paimon-common/src/main/java/org/apache/paimon/data/columnar/heap/AbstractHeapVector.java b/paimon-common/src/main/java/org/apache/paimon/data/columnar/heap/AbstractHeapVector.java index 702877642327c..f0e82eac4fb10 100644 --- a/paimon-common/src/main/java/org/apache/paimon/data/columnar/heap/AbstractHeapVector.java +++ b/paimon-common/src/main/java/org/apache/paimon/data/columnar/heap/AbstractHeapVector.java @@ -25,7 +25,8 @@ import java.util.Arrays; /** Heap vector that nullable shared structure. */ -public abstract class AbstractHeapVector extends AbstractWritableVector { +public abstract class AbstractHeapVector extends AbstractWritableVector + implements ElementCountable { public static final boolean LITTLE_ENDIAN = ByteOrder.nativeOrder() == ByteOrder.LITTLE_ENDIAN; @@ -116,6 +117,7 @@ public HeapIntVector getDictionaryIds() { return dictionaryIds; } + @Override public int getLen() { return this.len; } diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/position/RowPosition.java b/paimon-common/src/main/java/org/apache/paimon/data/columnar/heap/ElementCountable.java similarity index 60% rename from paimon-format/src/main/java/org/apache/paimon/format/parquet/position/RowPosition.java rename to paimon-common/src/main/java/org/apache/paimon/data/columnar/heap/ElementCountable.java index fb6378349007d..a32762d659fd0 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/position/RowPosition.java +++ b/paimon-common/src/main/java/org/apache/paimon/data/columnar/heap/ElementCountable.java @@ -16,25 +16,10 @@ * limitations under the License. */ -package org.apache.paimon.format.parquet.position; +package org.apache.paimon.data.columnar.heap; -import javax.annotation.Nullable; +/** Container with a known number of elements. */ +public interface ElementCountable { -/** To represent struct's position in repeated type. 
*/ -public class RowPosition { - @Nullable private final boolean[] isNull; - private final int positionsCount; - - public RowPosition(boolean[] isNull, int positionsCount) { - this.isNull = isNull; - this.positionsCount = positionsCount; - } - - public boolean[] getIsNull() { - return isNull; - } - - public int getPositionsCount() { - return positionsCount; - } + int getLen(); } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/BatchFileStoreITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/BatchFileStoreITCase.java index c30e6cd5612d3..cdc114b048a11 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/BatchFileStoreITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/BatchFileStoreITCase.java @@ -34,6 +34,7 @@ import org.junit.jupiter.params.ParameterizedTest; import org.junit.jupiter.params.provider.ValueSource; +import java.math.BigDecimal; import java.util.Collections; import java.util.HashMap; import java.util.List; @@ -573,6 +574,24 @@ public void testCountStarPK() { validateCount1NotPushDown(sql); } + @Test + public void testParquetRowDecimalAndTimestamp() { + sql( + "CREATE TABLE parquet_row_decimal(`row` ROW) WITH ('file.format' = 'parquet')"); + sql("INSERT INTO parquet_row_decimal VALUES ( (ROW(1.2)) )"); + + assertThat(sql("SELECT * FROM parquet_row_decimal")) + .containsExactly(Row.of(Row.of(new BigDecimal("1.2")))); + + sql( + "CREATE TABLE parquet_row_timestamp(`row` ROW) WITH ('file.format' = 'parquet')"); + sql("INSERT INTO parquet_row_timestamp VALUES ( (ROW(TIMESTAMP'2024-11-13 18:00:00')) )"); + + assertThat(sql("SELECT * FROM parquet_row_timestamp")) + .containsExactly( + Row.of(Row.of(DateTimeUtils.toLocalDateTime("2024-11-13 18:00:00", 0)))); + } + private void validateCount1PushDown(String sql) { Transformation transformation = AbstractTestBase.translate(tEnv, sql); while (!transformation.getInputs().isEmpty()) { diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java index 53b4b1634b5fc..f0151d6f3d8fb 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java @@ -23,6 +23,7 @@ import org.apache.paimon.data.columnar.ColumnarRow; import org.apache.paimon.data.columnar.ColumnarRowIterator; import org.apache.paimon.data.columnar.VectorizedColumnBatch; +import org.apache.paimon.data.columnar.heap.ElementCountable; import org.apache.paimon.data.columnar.writable.WritableColumnVector; import org.apache.paimon.format.FormatReaderFactory; import org.apache.paimon.format.parquet.reader.ColumnReader; @@ -293,7 +294,10 @@ private VectorizedColumnBatch createVectorizedColumnBatch( for (int i = 0; i < writableVectors.length; i++) { switch (projectedFields[i].type().getTypeRoot()) { case DECIMAL: - vectors[i] = new ParquetDecimalVector(writableVectors[i]); + vectors[i] = + new ParquetDecimalVector( + writableVectors[i], + ((ElementCountable) writableVectors[i]).getLen()); break; case TIMESTAMP_WITHOUT_TIME_ZONE: case TIMESTAMP_WITH_LOCAL_TIME_ZONE: diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedColumnReader.java index c89c77603dac2..68225fbd13207 100644 
--- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedColumnReader.java @@ -20,6 +20,7 @@ import org.apache.paimon.data.columnar.ColumnVector; import org.apache.paimon.data.columnar.heap.AbstractHeapVector; +import org.apache.paimon.data.columnar.heap.ElementCountable; import org.apache.paimon.data.columnar.heap.HeapArrayVector; import org.apache.paimon.data.columnar.heap.HeapMapVector; import org.apache.paimon.data.columnar.heap.HeapRowVector; @@ -134,7 +135,7 @@ private Pair readRow( String.format("Row field does not have any children: %s.", field)); } - int len = ((AbstractHeapVector) finalChildrenVectors[0]).getLen(); + int len = ((ElementCountable) finalChildrenVectors[0]).getLen(); boolean[] isNull = new boolean[len]; Arrays.fill(isNull, true); boolean hasNull = false; diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedPrimitiveColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedPrimitiveColumnReader.java index 7ee33a0bb5cc8..7d00ff79234ae 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedPrimitiveColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedPrimitiveColumnReader.java @@ -495,7 +495,7 @@ private WritableColumnVector fillColumnVector(int total, List valueList) { phiv.vector[i] = ((List) valueList).get(i); } } - return new ParquetDecimalVector(phiv); + return new ParquetDecimalVector(phiv, total); case INT64: HeapLongVector phlv = new HeapLongVector(total); for (int i = 0; i < valueList.size(); i++) { @@ -505,10 +505,10 @@ private WritableColumnVector fillColumnVector(int total, List valueList) { phlv.vector[i] = ((List) valueList).get(i); } } - return new ParquetDecimalVector(phlv); + return new ParquetDecimalVector(phlv, total); default: HeapBytesVector phbv = getHeapBytesVector(total, valueList); - return new ParquetDecimalVector(phbv); + return new ParquetDecimalVector(phbv, total); } default: throw new RuntimeException("Unsupported type in the list: " + type); diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetDecimalVector.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetDecimalVector.java index 28d308bac61f5..42714ab066dae 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetDecimalVector.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetDecimalVector.java @@ -25,6 +25,7 @@ import org.apache.paimon.data.columnar.Dictionary; import org.apache.paimon.data.columnar.IntColumnVector; import org.apache.paimon.data.columnar.LongColumnVector; +import org.apache.paimon.data.columnar.heap.ElementCountable; import org.apache.paimon.data.columnar.writable.WritableBytesVector; import org.apache.paimon.data.columnar.writable.WritableColumnVector; import org.apache.paimon.data.columnar.writable.WritableIntVector; @@ -38,12 +39,18 @@ * {@link DecimalColumnVector} interface. 
*/ public class ParquetDecimalVector - implements DecimalColumnVector, WritableLongVector, WritableIntVector, WritableBytesVector { + implements DecimalColumnVector, + WritableLongVector, + WritableIntVector, + WritableBytesVector, + ElementCountable { private final ColumnVector vector; + private final int len; - public ParquetDecimalVector(ColumnVector vector) { + public ParquetDecimalVector(ColumnVector vector, int len) { this.vector = vector; + this.len = len; } @Override @@ -225,4 +232,9 @@ public void fill(long value) { ((WritableLongVector) vector).fill(value); } } + + @Override + public int getLen() { + return len; + } } diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/RowColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/RowColumnReader.java deleted file mode 100644 index fa2da03ef312f..0000000000000 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/RowColumnReader.java +++ /dev/null @@ -1,59 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.paimon.format.parquet.reader; - -import org.apache.paimon.data.columnar.heap.HeapRowVector; -import org.apache.paimon.data.columnar.writable.WritableColumnVector; - -import java.io.IOException; -import java.util.List; - -/** Row {@link ColumnReader}. 
*/ -public class RowColumnReader implements ColumnReader { - - private final List fieldReaders; - - public RowColumnReader(List fieldReaders) { - this.fieldReaders = fieldReaders; - } - - @Override - public void readToVector(int readNumber, WritableColumnVector vector) throws IOException { - HeapRowVector rowVector = (HeapRowVector) vector; - WritableColumnVector[] vectors = rowVector.getFields(); - // row vector null array - boolean[] isNulls = new boolean[readNumber]; - for (int i = 0; i < vectors.length; i++) { - fieldReaders.get(i).readToVector(readNumber, vectors[i]); - - for (int j = 0; j < readNumber; j++) { - if (i == 0) { - isNulls[j] = vectors[i].isNullAt(j); - } else { - isNulls[j] = isNulls[j] && vectors[i].isNullAt(j); - } - if (i == vectors.length - 1 && isNulls[j]) { - // rowColumnVector[j] is null only when all fields[j] of rowColumnVector[j] is - // null - rowVector.setNullAt(j); - } - } - } - } -} From 8b772071df5516a60cf9dc2f0b1029ecea36adee Mon Sep 17 00:00:00 2001 From: Jingsong Date: Thu, 14 Nov 2024 22:55:52 +0800 Subject: [PATCH 023/157] [doc] Update roadmap --- docs/content/project/roadmap.md | 49 ++++----------------------------- 1 file changed, 6 insertions(+), 43 deletions(-) diff --git a/docs/content/project/roadmap.md b/docs/content/project/roadmap.md index 2f6b63af00a10..34628e28c80f4 100644 --- a/docs/content/project/roadmap.md +++ b/docs/content/project/roadmap.md @@ -26,16 +26,6 @@ under the License. # Roadmap -## Native Format IO - -Integrate native Parquet & ORC reader & writer. - -## Deletion Vectors (Merge On Write) - -1. Primary Key Table Deletion Vectors Mode supports async compaction. -2. Append Table supports DELETE & UPDATE with Deletion Vectors Mode. (Now only Spark SQL) -3. Optimize lookup performance for HDD disk. - ## Flink Lookup Join Support Flink Custom Data Distribution Lookup Join to reach large-scale data lookup join. @@ -44,51 +34,24 @@ Support Flink Custom Data Distribution Lookup Join to reach large-scale data loo Introduce a mode to produce Iceberg snapshots. -## Branch - -Branch production ready. - -## Changelog life cycle decouple - -Changelog life cycle decouple supports none changelog-producer. - -## Partition Mark Done - -Support partition mark done. - -## Default File Format - -- Default compression is ZSTD with level 1. -- Parquet supports filter push down. -- Parquet supports arrow with row type element. -- Parquet becomes default file format. - ## Variant Type Support Variant Type with Spark 4.0 and Flink 2.0. Unlocking support for semi-structured data. -## Bucketed Join - -Support Bucketed Join with Spark SQL to reduce shuffler in Join. - ## File Index Add more index: -1. Bitmap -2. Inverse -## Column Family +1. Inverse + +## Vector Compaction -Support Column Family for super Wide Table. +Support Vector Compaction for super Wide Table. -## View & Function support +## Function support -Paimon Catalog supports views and functions. +Paimon Catalog supports functions. ## Files Schema Evolution Ingestion Introduce a files Ingestion with Schema Evolution. - -## Foreign Key Join - -Explore Foreign Key Join solution. 
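The parquet ROW fix above threads an explicit element count through ParquetDecimalVector by way of the new ElementCountable interface, because the wrapped ColumnVector interface alone does not expose how many elements it holds. A minimal, self-contained sketch of that wrapping pattern is shown below; the class names, fields, and scale handling are simplified stand-ins for illustration and are not the actual Paimon implementations.

```java
import java.math.BigDecimal;

public class ElementCountableSketch {

    /** Stand-in for the new ElementCountable interface: expose a known element count. */
    interface ElementCountable {
        int getLen();
    }

    /** Stand-in for ColumnVector; note it has no length accessor of its own. */
    interface ColumnVector {
        boolean isNullAt(int i);
    }

    /** Toy heap vector that knows its own length, like AbstractHeapVector after the patch. */
    static final class HeapLongVector implements ColumnVector, ElementCountable {
        final long[] values;

        HeapLongVector(int len) {
            this.values = new long[len];
        }

        @Override
        public boolean isNullAt(int i) {
            return false; // nullability elided for brevity
        }

        @Override
        public int getLen() {
            return values.length;
        }
    }

    /**
     * Toy decimal wrapper, analogous to ParquetDecimalVector taking an explicit len:
     * the wrapped ColumnVector cannot report its element count, so the caller captures
     * the length before wrapping and the wrapper re-exposes it via getLen().
     */
    static final class DecimalVector implements ColumnVector, ElementCountable {
        private final HeapLongVector unscaled;
        private final int len;
        private final int scale;

        DecimalVector(HeapLongVector unscaled, int len, int scale) {
            this.unscaled = unscaled;
            this.len = len;
            this.scale = scale;
        }

        BigDecimal getDecimal(int i) {
            return BigDecimal.valueOf(unscaled.values[i], scale);
        }

        @Override
        public boolean isNullAt(int i) {
            return unscaled.isNullAt(i);
        }

        @Override
        public int getLen() {
            return len;
        }
    }

    public static void main(String[] args) {
        HeapLongVector raw = new HeapLongVector(3);
        raw.values[0] = 120; // 1.20 at scale 2
        raw.values[1] = 5;   // 0.05
        raw.values[2] = 999; // 9.99

        // Length is taken from the countable source vector before wrapping, mirroring
        // new ParquetDecimalVector(writableVectors[i], ((ElementCountable) writableVectors[i]).getLen()).
        DecimalVector decimals = new DecimalVector(raw, raw.getLen(), 2);

        for (int i = 0; i < decimals.getLen(); i++) {
            System.out.println(decimals.getDecimal(i));
        }
    }
}
```

Passing the length explicitly keeps the wrapper usable over any ColumnVector implementation, which is what lets the nested readers above ask for getLen() without caring whether a child vector is a heap vector or a decimal wrapper.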
From d3384ac16d0ee955918f4ba8d2ddc756570877e4 Mon Sep 17 00:00:00 2001 From: Jingsong Date: Thu, 14 Nov 2024 23:01:32 +0800 Subject: [PATCH 024/157] [doc] Add doc to 'partition.mark-done-action' --- docs/content/flink/sql-write.md | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/docs/content/flink/sql-write.md b/docs/content/flink/sql-write.md index 008fe498363cd..33adac5fb7f49 100644 --- a/docs/content/flink/sql-write.md +++ b/docs/content/flink/sql-write.md @@ -257,7 +257,8 @@ CREATE TABLE my_partitioned_table ( 'partition.timestamp-formatter'='yyyyMMdd', 'partition.timestamp-pattern'='$dt', 'partition.time-interval'='1 d', - 'partition.idle-time-to-done'='15 m' + 'partition.idle-time-to-done'='15 m', + 'partition.mark-done-action'='done-partition' ); ``` @@ -267,4 +268,5 @@ CREATE TABLE my_partitioned_table ( and then it will be marked as done. 3. Thirdly, by default, partition mark done will create _SUCCESS file, the content of _SUCCESS file is a json, contains `creationTime` and `modificationTime`, they can help you understand if there is any delayed data. You can also - configure other actions. + configure other actions, like `'done-partition'`, for example, partition `'dt=20240501'` with produce + `'dt=20240501.done'` done partition. From 203db415d519106d9f3d20a0fe83af58c71e78ea Mon Sep 17 00:00:00 2001 From: yuzelin <33053040+yuzelin@users.noreply.github.com> Date: Mon, 18 Nov 2024 13:36:32 +0800 Subject: [PATCH 025/157] [core] Fix that batch unaware bucket compact cannot stop when there is no snapshot (#4539) --- .../UnawareAppendTableCompactionCoordinator.java | 3 +++ .../UnawareAppendTableCompactionCoordinatorTest.java | 11 +++++++++++ 2 files changed, 14 insertions(+) diff --git a/paimon-core/src/main/java/org/apache/paimon/append/UnawareAppendTableCompactionCoordinator.java b/paimon-core/src/main/java/org/apache/paimon/append/UnawareAppendTableCompactionCoordinator.java index 9a54ea72e7cc9..842b223167b27 100644 --- a/paimon-core/src/main/java/org/apache/paimon/append/UnawareAppendTableCompactionCoordinator.java +++ b/paimon-core/src/main/java/org/apache/paimon/append/UnawareAppendTableCompactionCoordinator.java @@ -387,6 +387,9 @@ private void assignNewIterator() { if (nextSnapshot == null) { nextSnapshot = snapshotManager.latestSnapshotId(); if (nextSnapshot == null) { + if (!streamingMode) { + throw new EndOfScanException(); + } return; } snapshotReader.withMode(ScanMode.ALL); diff --git a/paimon-core/src/test/java/org/apache/paimon/append/UnawareAppendTableCompactionCoordinatorTest.java b/paimon-core/src/test/java/org/apache/paimon/append/UnawareAppendTableCompactionCoordinatorTest.java index 95826c195ec72..9bb461ffe151c 100644 --- a/paimon-core/src/test/java/org/apache/paimon/append/UnawareAppendTableCompactionCoordinatorTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/append/UnawareAppendTableCompactionCoordinatorTest.java @@ -29,6 +29,7 @@ import org.apache.paimon.schema.TableSchema; import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.FileStoreTableFactory; +import org.apache.paimon.table.source.EndOfScanException; import org.apache.paimon.types.DataTypes; import org.junit.jupiter.api.BeforeEach; @@ -43,7 +44,9 @@ import static org.apache.paimon.mergetree.compact.MergeTreeCompactManagerTest.row; import static org.apache.paimon.stats.StatsTestUtils.newSimpleStats; +import static org.apache.paimon.testutils.assertj.PaimonAssertions.anyCauseMatches; import static org.assertj.core.api.Assertions.assertThat; +import 
static org.assertj.core.api.Assertions.assertThatThrownBy; /** Tests for {@link UnawareAppendTableCompactionCoordinator}. */ public class UnawareAppendTableCompactionCoordinatorTest { @@ -135,6 +138,14 @@ public void testAgeGrowUp() { .isEqualTo(0); } + @Test + public void testBatchScanEmptyTable() { + compactionCoordinator = + new UnawareAppendTableCompactionCoordinator(appendOnlyFileStoreTable, false); + assertThatThrownBy(() -> compactionCoordinator.scan()) + .satisfies(anyCauseMatches(EndOfScanException.class)); + } + private void assertTasks(List files, int taskNum) { compactionCoordinator.notifyNewFiles(partition, files); List tasks = compactionCoordinator.compactPlan(); From 220789d5ab4c566f72584d2b85980c777fd7807d Mon Sep 17 00:00:00 2001 From: wangwj Date: Mon, 18 Nov 2024 15:20:42 +0800 Subject: [PATCH 026/157] [core] support drop stats in result of scan plan (#4506) --- .../org/apache/paimon/io/DataFileMeta.java | 21 ++++++++++++++++++ .../apache/paimon/manifest/ManifestEntry.java | 4 ++++ .../operation/AbstractFileStoreScan.java | 13 +++++++++++ .../paimon/operation/FileStoreScan.java | 2 ++ .../table/source/AbstractDataTableScan.java | 6 +++++ .../paimon/table/source/InnerTableScan.java | 5 +++++ .../paimon/table/source/ReadBuilder.java | 3 +++ .../paimon/table/source/ReadBuilderImpl.java | 11 ++++++++++ .../table/source/snapshot/SnapshotReader.java | 2 ++ .../source/snapshot/SnapshotReaderImpl.java | 6 +++++ .../paimon/table/system/AuditLogTable.java | 6 +++++ .../operation/KeyValueFileStoreScanTest.java | 22 +++++++++++++++++++ .../source/ContinuousFileStoreSource.java | 2 +- .../paimon/flink/source/FlinkTableSource.java | 8 ++++++- .../flink/source/StaticFileStoreSource.java | 2 +- .../source/operator/MonitorFunction.java | 2 +- 16 files changed, 111 insertions(+), 4 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/io/DataFileMeta.java b/paimon-core/src/main/java/org/apache/paimon/io/DataFileMeta.java index b6cac5ae51304..bb9e45ff002da 100644 --- a/paimon-core/src/main/java/org/apache/paimon/io/DataFileMeta.java +++ b/paimon-core/src/main/java/org/apache/paimon/io/DataFileMeta.java @@ -409,6 +409,27 @@ public DataFileMeta rename(String newFileName) { valueStatsCols); } + public DataFileMeta copyWithoutStats() { + return new DataFileMeta( + fileName, + fileSize, + rowCount, + minKey, + maxKey, + keyStats, + EMPTY_STATS, + minSequenceNumber, + maxSequenceNumber, + schemaId, + level, + extraFiles, + creationTime, + deleteRowCount, + embeddedIndex, + fileSource, + Collections.emptyList()); + } + public List collectFiles(DataFilePathFactory pathFactory) { List paths = new ArrayList<>(); paths.add(pathFactory.toPath(fileName)); diff --git a/paimon-core/src/main/java/org/apache/paimon/manifest/ManifestEntry.java b/paimon-core/src/main/java/org/apache/paimon/manifest/ManifestEntry.java index f7c5c4639a6f2..ee5dc2c344214 100644 --- a/paimon-core/src/main/java/org/apache/paimon/manifest/ManifestEntry.java +++ b/paimon-core/src/main/java/org/apache/paimon/manifest/ManifestEntry.java @@ -121,6 +121,10 @@ public Identifier identifier() { file.embeddedIndex()); } + public ManifestEntry copyWithoutStats() { + return new ManifestEntry(kind, partition, bucket, totalBuckets, file.copyWithoutStats()); + } + @Override public boolean equals(Object o) { if (!(o instanceof ManifestEntry)) { diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/AbstractFileStoreScan.java b/paimon-core/src/main/java/org/apache/paimon/operation/AbstractFileStoreScan.java index 
683e6ffda481e..0e1f9357e312c 100644 --- a/paimon-core/src/main/java/org/apache/paimon/operation/AbstractFileStoreScan.java +++ b/paimon-core/src/main/java/org/apache/paimon/operation/AbstractFileStoreScan.java @@ -90,6 +90,7 @@ public abstract class AbstractFileStoreScan implements FileStoreScan { private ManifestCacheFilter manifestCacheFilter = null; private ScanMetrics scanMetrics = null; + private boolean dropStats; public AbstractFileStoreScan( ManifestsReader manifestsReader, @@ -105,6 +106,7 @@ public AbstractFileStoreScan( this.manifestFileFactory = manifestFileFactory; this.tableSchemas = new ConcurrentHashMap<>(); this.parallelism = parallelism; + this.dropStats = false; } @Override @@ -215,6 +217,12 @@ public FileStoreScan withMetrics(ScanMetrics metrics) { return this; } + @Override + public FileStoreScan dropStats() { + this.dropStats = true; + return this; + } + @Nullable @Override public Integer parallelism() { @@ -291,6 +299,11 @@ public Snapshot snapshot() { @Override public List files() { + if (dropStats) { + return files.stream() + .map(ManifestEntry::copyWithoutStats) + .collect(Collectors.toList()); + } return files; } }; diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/FileStoreScan.java b/paimon-core/src/main/java/org/apache/paimon/operation/FileStoreScan.java index bc0d7ff27301a..e643bf1617b4d 100644 --- a/paimon-core/src/main/java/org/apache/paimon/operation/FileStoreScan.java +++ b/paimon-core/src/main/java/org/apache/paimon/operation/FileStoreScan.java @@ -81,6 +81,8 @@ public interface FileStoreScan { FileStoreScan withMetrics(ScanMetrics metrics); + FileStoreScan dropStats(); + @Nullable Integer parallelism(); diff --git a/paimon-core/src/main/java/org/apache/paimon/table/source/AbstractDataTableScan.java b/paimon-core/src/main/java/org/apache/paimon/table/source/AbstractDataTableScan.java index 6a8aa9265e5c6..24c6943f546fe 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/source/AbstractDataTableScan.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/source/AbstractDataTableScan.java @@ -102,6 +102,12 @@ public AbstractDataTableScan withMetricsRegistry(MetricRegistry metricsRegistry) return this; } + @Override + public AbstractDataTableScan dropStats() { + snapshotReader.dropStats(); + return this; + } + public CoreOptions options() { return options; } diff --git a/paimon-core/src/main/java/org/apache/paimon/table/source/InnerTableScan.java b/paimon-core/src/main/java/org/apache/paimon/table/source/InnerTableScan.java index 00a4fc0cde18b..c2425ff16f97f 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/source/InnerTableScan.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/source/InnerTableScan.java @@ -55,4 +55,9 @@ default InnerTableScan withMetricsRegistry(MetricRegistry metricRegistry) { // do nothing, should implement this if need return this; } + + default InnerTableScan dropStats() { + // do nothing, should implement this if need + return this; + } } diff --git a/paimon-core/src/main/java/org/apache/paimon/table/source/ReadBuilder.java b/paimon-core/src/main/java/org/apache/paimon/table/source/ReadBuilder.java index 91d5f1004e914..0c1386ce441d8 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/source/ReadBuilder.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/source/ReadBuilder.java @@ -150,6 +150,9 @@ default ReadBuilder withProjection(int[][] projection) { */ ReadBuilder withShard(int indexOfThisSubtask, int numberOfParallelSubtasks); + /** Delete stats in scan 
plan result. */ + ReadBuilder dropStats(); + /** Create a {@link TableScan} to perform batch planning. */ TableScan newScan(); diff --git a/paimon-core/src/main/java/org/apache/paimon/table/source/ReadBuilderImpl.java b/paimon-core/src/main/java/org/apache/paimon/table/source/ReadBuilderImpl.java index 577b0a20a99b3..95bfe6f24bc77 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/source/ReadBuilderImpl.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/source/ReadBuilderImpl.java @@ -51,6 +51,8 @@ public class ReadBuilderImpl implements ReadBuilder { private @Nullable RowType readType; + private boolean dropStats = false; + public ReadBuilderImpl(InnerTable table) { this.table = table; } @@ -124,6 +126,12 @@ public ReadBuilder withBucketFilter(Filter bucketFilter) { return this; } + @Override + public ReadBuilder dropStats() { + this.dropStats = true; + return this; + } + @Override public TableScan newScan() { InnerTableScan tableScan = configureScan(table.newScan()); @@ -156,6 +164,9 @@ private InnerTableScan configureScan(InnerTableScan scan) { if (bucketFilter != null) { scan.withBucketFilter(bucketFilter); } + if (dropStats) { + scan.dropStats(); + } return scan; } diff --git a/paimon-core/src/main/java/org/apache/paimon/table/source/snapshot/SnapshotReader.java b/paimon-core/src/main/java/org/apache/paimon/table/source/snapshot/SnapshotReader.java index 2dd02be04f7c5..b59cf98bbb4c2 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/source/snapshot/SnapshotReader.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/source/snapshot/SnapshotReader.java @@ -85,6 +85,8 @@ public interface SnapshotReader { SnapshotReader withDataFileNameFilter(Filter fileNameFilter); + SnapshotReader dropStats(); + SnapshotReader withShard(int indexOfThisSubtask, int numberOfParallelSubtasks); SnapshotReader withMetricRegistry(MetricRegistry registry); diff --git a/paimon-core/src/main/java/org/apache/paimon/table/source/snapshot/SnapshotReaderImpl.java b/paimon-core/src/main/java/org/apache/paimon/table/source/snapshot/SnapshotReaderImpl.java index f4591734b68e3..7ce537ee52ec1 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/source/snapshot/SnapshotReaderImpl.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/source/snapshot/SnapshotReaderImpl.java @@ -264,6 +264,12 @@ public SnapshotReader withDataFileNameFilter(Filter fileNameFilter) { return this; } + @Override + public SnapshotReader dropStats() { + scan.dropStats(); + return this; + } + @Override public SnapshotReader withShard(int indexOfThisSubtask, int numberOfParallelSubtasks) { if (splitGenerator.alwaysRawConvertible()) { diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/AuditLogTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/AuditLogTable.java index 7438f9393d604..e56ee90412ceb 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/AuditLogTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/AuditLogTable.java @@ -342,6 +342,12 @@ public SnapshotReader withDataFileNameFilter(Filter fileNameFilter) { return this; } + @Override + public SnapshotReader dropStats() { + wrapped.dropStats(); + return this; + } + @Override public SnapshotReader withShard(int indexOfThisSubtask, int numberOfParallelSubtasks) { wrapped.withShard(indexOfThisSubtask, numberOfParallelSubtasks); diff --git a/paimon-core/src/test/java/org/apache/paimon/operation/KeyValueFileStoreScanTest.java 
b/paimon-core/src/test/java/org/apache/paimon/operation/KeyValueFileStoreScanTest.java index ce17450538b1b..2fd8c10cd9445 100644 --- a/paimon-core/src/test/java/org/apache/paimon/operation/KeyValueFileStoreScanTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/operation/KeyValueFileStoreScanTest.java @@ -50,6 +50,7 @@ import java.util.concurrent.ThreadLocalRandom; import java.util.stream.Collectors; +import static org.apache.paimon.stats.SimpleStats.EMPTY_STATS; import static org.assertj.core.api.Assertions.assertThat; /** Tests for {@link KeyValueFileStoreScan}. */ @@ -274,6 +275,27 @@ public void testWithManifestList() throws Exception { runTestExactMatch(scan, null, expected); } + @Test + public void testDropStatsInPlan() throws Exception { + ThreadLocalRandom random = ThreadLocalRandom.current(); + List data = generateData(100, 0, (long) Math.abs(random.nextInt(1000))); + writeData(data, 0); + data = generateData(100, 1, (long) Math.abs(random.nextInt(1000)) + 1000); + writeData(data, 0); + data = generateData(100, 2, (long) Math.abs(random.nextInt(1000)) + 2000); + writeData(data, 0); + data = generateData(100, 3, (long) Math.abs(random.nextInt(1000)) + 3000); + Snapshot snapshot = writeData(data, 0); + + KeyValueFileStoreScan scan = store.newScan(); + scan.withSnapshot(snapshot.id()).dropStats(); + List files = scan.plan().files(); + + for (ManifestEntry manifestEntry : files) { + assertThat(manifestEntry.file().valueStats()).isEqualTo(EMPTY_STATS); + } + } + private void runTestExactMatch( FileStoreScan scan, Long expectedSnapshotId, Map expected) throws Exception { diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/ContinuousFileStoreSource.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/ContinuousFileStoreSource.java index 559976921e2e0..b7eb1d625ce3b 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/ContinuousFileStoreSource.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/ContinuousFileStoreSource.java @@ -77,7 +77,7 @@ public SplitEnumerator restoreEnu nextSnapshotId = checkpoint.currentSnapshotId(); splits = checkpoint.splits(); } - StreamTableScan scan = readBuilder.newStreamScan(); + StreamTableScan scan = readBuilder.dropStats().newStreamScan(); if (metricGroup(context) != null) { ((StreamDataTableScan) scan) .withMetricsRegistry(new FlinkMetricRegistry(context.metricGroup())); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkTableSource.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkTableSource.java index 2be0248f3ce8c..9bfd36fdfaa81 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkTableSource.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkTableSource.java @@ -175,6 +175,7 @@ protected void scanSplitsForInference() { List partitionEntries = table.newReadBuilder() .withFilter(predicate) + .dropStats() .newScan() .listPartitionEntries(); long totalSize = 0; @@ -188,7 +189,12 @@ protected void scanSplitsForInference() { new SplitStatistics((int) (totalSize / splitTargetSize + 1), rowCount); } else { List splits = - table.newReadBuilder().withFilter(predicate).newScan().plan().splits(); + table.newReadBuilder() + .withFilter(predicate) + .dropStats() + .newScan() + .plan() + .splits(); splitStatistics = new SplitStatistics( 
splits.size(), splits.stream().mapToLong(Split::rowCount).sum()); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/StaticFileStoreSource.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/StaticFileStoreSource.java index af425aab5e469..c388a6dccbbce 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/StaticFileStoreSource.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/StaticFileStoreSource.java @@ -87,7 +87,7 @@ public SplitEnumerator restoreEnu private List getSplits(SplitEnumeratorContext context) { FileStoreSourceSplitGenerator splitGenerator = new FileStoreSourceSplitGenerator(); - TableScan scan = readBuilder.newScan(); + TableScan scan = readBuilder.dropStats().newScan(); // register scan metrics if (context.metricGroup() != null) { ((InnerTableScan) scan) diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/MonitorFunction.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/MonitorFunction.java index 3805f6f8c536e..f21922670471b 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/MonitorFunction.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/MonitorFunction.java @@ -106,7 +106,7 @@ public MonitorFunction( @Override public void initializeState(FunctionInitializationContext context) throws Exception { - this.scan = readBuilder.newStreamScan(); + this.scan = readBuilder.dropStats().newStreamScan(); this.checkpointState = context.getOperatorStateStore() From 9a334c80d6fc1e4c0bfc13561a25eda674990d29 Mon Sep 17 00:00:00 2001 From: Zouxxyy Date: Tue, 19 Nov 2024 08:53:19 +0800 Subject: [PATCH 027/157] [hive] Sync db owner prop to hms when creating the db (#4544) --- .../org/apache/paimon/catalog/Catalog.java | 6 +++-- .../org/apache/paimon/hive/HiveCatalog.java | 11 +++++--- .../sql/DDLWithHiveCatalogTestBase.scala | 27 ++++++++----------- 3 files changed, 23 insertions(+), 21 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/catalog/Catalog.java b/paimon-core/src/main/java/org/apache/paimon/catalog/Catalog.java index 6a6a047bd38cd..d919c59782975 100644 --- a/paimon-core/src/main/java/org/apache/paimon/catalog/Catalog.java +++ b/paimon-core/src/main/java/org/apache/paimon/catalog/Catalog.java @@ -52,10 +52,12 @@ public interface Catalog extends AutoCloseable { String SYSTEM_TABLE_SPLITTER = "$"; String SYSTEM_DATABASE_NAME = "sys"; String SYSTEM_BRANCH_PREFIX = "branch_"; - String COMMENT_PROP = "comment"; String TABLE_DEFAULT_OPTION_PREFIX = "table-default."; - String DB_LOCATION_PROP = "location"; String DB_SUFFIX = ".db"; + + String COMMENT_PROP = "comment"; + String OWNER_PROP = "owner"; + String DB_LOCATION_PROP = "location"; String NUM_ROWS_PROP = "numRows"; String NUM_FILES_PROP = "numFiles"; String TOTAL_SIZE_PROP = "totalSize"; diff --git a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java index 8b8b62934dbdb..eed0fdb9bff14 100644 --- a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java +++ b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java @@ -283,6 +283,8 @@ private Database convertToHiveDatabase(String name, Map properti (key, 
value) -> { if (key.equals(COMMENT_PROP)) { database.setDescription(value); + } else if (key.equals(OWNER_PROP)) { + database.setOwnerName(value); } else if (key.equals(DB_LOCATION_PROP)) { database.setLocationUri(value); } else if (value != null) { @@ -299,12 +301,15 @@ public org.apache.paimon.catalog.Database getDatabaseImpl(String name) try { Database database = clients.run(client -> client.getDatabase(name)); Map options = new HashMap<>(database.getParameters()); - if (database.getLocationUri() != null) { - options.put(DB_LOCATION_PROP, database.getLocationUri()); - } if (database.getDescription() != null) { options.put(COMMENT_PROP, database.getDescription()); } + if (database.getOwnerName() != null) { + options.put(OWNER_PROP, database.getOwnerName()); + } + if (database.getLocationUri() != null) { + options.put(DB_LOCATION_PROP, database.getLocationUri()); + } return org.apache.paimon.catalog.Database.of(name, options, database.getDescription()); } catch (NoSuchObjectException e) { throw new DatabaseNotExistException(name); diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala b/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala index 7478f9628cfbf..33b993160dfd7 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala +++ b/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala @@ -189,6 +189,7 @@ abstract class DDLWithHiveCatalogTestBase extends PaimonHiveTestBase { val props = getDatabaseProps("paimon_db") Assertions.assertEquals(props("k1"), "v1") Assertions.assertEquals(props("k2"), "v2") + Assertions.assertTrue(getDatabaseOwner("paimon_db").nonEmpty) } } } @@ -296,29 +297,23 @@ abstract class DDLWithHiveCatalogTestBase extends PaimonHiveTestBase { } } - def getDatabaseLocation(dbName: String): String = { + def getDatabaseProp(dbName: String, propertyName: String): String = { spark - .sql(s"DESC DATABASE $dbName") - .filter("info_name == 'Location'") + .sql(s"DESC DATABASE EXTENDED $dbName") + .filter(s"info_name == '$propertyName'") .head() .getAs[String]("info_value") - .split(":")(1) } - def getDatabaseComment(dbName: String): String = { - spark - .sql(s"DESC DATABASE $dbName") - .filter("info_name == 'Comment'") - .head() - .getAs[String]("info_value") - } + def getDatabaseLocation(dbName: String): String = + getDatabaseProp(dbName, "Location").split(":")(1) + + def getDatabaseComment(dbName: String): String = getDatabaseProp(dbName, "Comment") + + def getDatabaseOwner(dbName: String): String = getDatabaseProp(dbName, "Owner") def getDatabaseProps(dbName: String): Map[String, String] = { - val dbPropsStr = spark - .sql(s"DESC DATABASE EXTENDED $dbName") - .filter("info_name == 'Properties'") - .head() - .getAs[String]("info_value") + val dbPropsStr = getDatabaseProp(dbName, "Properties") val pattern = "\\(([^,]+),([^)]+)\\)".r pattern .findAllIn(dbPropsStr.drop(1).dropRight(1)) From 19d7f66a006d02ee3ad233937fc6116a07acefbb Mon Sep 17 00:00:00 2001 From: Zouxxyy Date: Tue, 19 Nov 2024 11:02:16 +0800 Subject: [PATCH 028/157] [spark] Introduce View Support to SparkCatalog (#4538) --- .../RewritePaimonViewCommands.scala | 80 ++++++++++++ .../paimon/spark/sql/PaimonViewTest.scala | 21 ++++ .../RewritePaimonViewCommands.scala | 79 ++++++++++++ .../paimon/spark/sql/PaimonViewTest.scala | 21 ++++ .../paimon/spark/sql/PaimonViewTest.scala | 
21 ++++ .../paimon/spark/sql/PaimonViewTest.scala | 21 ++++ .../paimon/spark/sql/PaimonViewTest.scala | 21 ++++ .../org/apache/paimon/spark/SparkCatalog.java | 49 ++------ .../apache/paimon/spark/SparkTypeUtils.java | 4 + .../paimon/spark/catalog/SupportView.java | 86 +++++++++++++ .../paimon/spark/utils/CatalogUtils.java | 41 ++++++ .../analysis/PaimonViewResolver.scala | 85 +++++++++++++ .../plans/logical/PaimonViewCommand.scala | 74 +++++++++++ .../spark/execution/PaimonStrategy.scala | 37 +++++- .../spark/execution/PaimonViewExec.scala | 117 ++++++++++++++++++ .../PaimonSparkSessionExtensions.scala | 3 +- .../paimon/spark/leafnode/package.scala | 7 +- .../PaimonSparkSqlExtensionsParser.scala | 4 +- .../PaimonSqlExtensionsAstBuilder.scala | 13 +- .../RewritePaimonViewCommands.scala | 77 ++++++++++++ .../sql/DDLWithHiveCatalogTestBase.scala | 4 +- .../paimon/spark/sql/PaimonViewTestBase.scala | 96 ++++++++++++++ 22 files changed, 914 insertions(+), 47 deletions(-) create mode 100644 paimon-spark/paimon-spark-3.2/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala create mode 100644 paimon-spark/paimon-spark-3.2/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala create mode 100644 paimon-spark/paimon-spark-3.3/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala create mode 100644 paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala create mode 100644 paimon-spark/paimon-spark-3.4/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala create mode 100644 paimon-spark/paimon-spark-3.5/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala create mode 100644 paimon-spark/paimon-spark-4.0/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala create mode 100644 paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/catalog/SupportView.java create mode 100644 paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/utils/CatalogUtils.java create mode 100644 paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/PaimonViewResolver.scala create mode 100644 paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/plans/logical/PaimonViewCommand.scala create mode 100644 paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/execution/PaimonViewExec.scala create mode 100644 paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala create mode 100644 paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTestBase.scala diff --git a/paimon-spark/paimon-spark-3.2/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala b/paimon-spark/paimon-spark-3.2/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala new file mode 100644 index 0000000000000..e759edd0c2c69 --- /dev/null +++ b/paimon-spark/paimon-spark-3.2/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala @@ -0,0 +1,80 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. 
The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.spark.sql.catalyst.parser.extensions + +import org.apache.paimon.spark.catalog.SupportView +import org.apache.paimon.spark.catalyst.plans.logical.{CreatePaimonView, DropPaimonView, ResolvedIdentifier, ShowPaimonViews} + +import org.apache.spark.sql.SparkSession +import org.apache.spark.sql.catalyst.analysis.{CTESubstitution, ResolvedNamespace, UnresolvedView} +import org.apache.spark.sql.catalyst.plans.logical._ +import org.apache.spark.sql.catalyst.rules.Rule +import org.apache.spark.sql.connector.catalog.{CatalogManager, LookupCatalog} + +case class RewritePaimonViewCommands(spark: SparkSession) + extends Rule[LogicalPlan] + with LookupCatalog { + + protected lazy val catalogManager: CatalogManager = spark.sessionState.catalogManager + + override def apply(plan: LogicalPlan): LogicalPlan = plan.resolveOperatorsUp { + + case CreateViewStatement( + ResolvedIdent(resolved), + userSpecifiedColumns, + comment, + properties, + Some(originalText), + child, + allowExisting, + replace, + _) => + CreatePaimonView( + child = resolved, + queryText = originalText, + query = CTESubstitution.apply(child), + columnAliases = userSpecifiedColumns.map(_._1), + columnComments = userSpecifiedColumns.map(_._2.orElse(Option.empty)), + comment = comment, + properties = properties, + allowExisting = allowExisting, + replace = replace + ) + + case DropView(ResolvedIdent(resolved), ifExists: Boolean) => + DropPaimonView(resolved, ifExists) + + case ShowViews(_, pattern, output) if catalogManager.currentCatalog.isInstanceOf[SupportView] => + ShowPaimonViews( + ResolvedNamespace(catalogManager.currentCatalog, catalogManager.currentNamespace), + pattern, + output) + } + + private object ResolvedIdent { + def unapply(unresolved: Any): Option[ResolvedIdentifier] = unresolved match { + case CatalogAndIdentifier(viewCatalog: SupportView, ident) => + Some(ResolvedIdentifier(viewCatalog, ident)) + case UnresolvedView(CatalogAndIdentifier(viewCatalog: SupportView, ident), _, _, _) => + Some(ResolvedIdentifier(viewCatalog, ident)) + case _ => + None + } + } +} diff --git a/paimon-spark/paimon-spark-3.2/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala b/paimon-spark/paimon-spark-3.2/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala new file mode 100644 index 0000000000000..6ab8a2671b518 --- /dev/null +++ b/paimon-spark/paimon-spark-3.2/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala @@ -0,0 +1,21 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. 
You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.sql + +class PaimonViewTest extends PaimonViewTestBase {} diff --git a/paimon-spark/paimon-spark-3.3/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala b/paimon-spark/paimon-spark-3.3/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala new file mode 100644 index 0000000000000..5d57cda2f34b2 --- /dev/null +++ b/paimon-spark/paimon-spark-3.3/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala @@ -0,0 +1,79 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.spark.sql.catalyst.parser.extensions + +import org.apache.paimon.spark.catalog.SupportView +import org.apache.paimon.spark.catalyst.plans.logical.{CreatePaimonView, DropPaimonView, ResolvedIdentifier, ShowPaimonViews} + +import org.apache.spark.sql.SparkSession +import org.apache.spark.sql.catalyst.analysis.{CTESubstitution, ResolvedNamespace, UnresolvedDBObjectName, UnresolvedView} +import org.apache.spark.sql.catalyst.plans.logical._ +import org.apache.spark.sql.catalyst.rules.Rule +import org.apache.spark.sql.connector.catalog.{CatalogManager, LookupCatalog} + +case class RewritePaimonViewCommands(spark: SparkSession) + extends Rule[LogicalPlan] + with LookupCatalog { + + protected lazy val catalogManager: CatalogManager = spark.sessionState.catalogManager + + override def apply(plan: LogicalPlan): LogicalPlan = plan.resolveOperatorsUp { + + case CreateView( + ResolvedIdent(resolved), + userSpecifiedColumns, + comment, + properties, + Some(queryText), + query, + allowExisting, + replace) => + CreatePaimonView( + child = resolved, + queryText = queryText, + query = CTESubstitution.apply(query), + columnAliases = userSpecifiedColumns.map(_._1), + columnComments = userSpecifiedColumns.map(_._2.orElse(Option.empty)), + comment = comment, + properties = properties, + allowExisting = allowExisting, + replace = replace + ) + + case DropView(ResolvedIdent(resolved), ifExists: Boolean) => + DropPaimonView(resolved, ifExists) + + case ShowViews(_, pattern, output) if catalogManager.currentCatalog.isInstanceOf[SupportView] => + ShowPaimonViews( + ResolvedNamespace(catalogManager.currentCatalog, catalogManager.currentNamespace), + pattern, + output) + } + + private object ResolvedIdent { + def unapply(unresolved: Any): Option[ResolvedIdentifier] = unresolved match { + case UnresolvedDBObjectName(CatalogAndIdentifier(viewCatalog: SupportView, ident), _) => + Some(ResolvedIdentifier(viewCatalog, ident)) + case UnresolvedView(CatalogAndIdentifier(viewCatalog: SupportView, ident), _, _, _) => + Some(ResolvedIdentifier(viewCatalog, ident)) + case _ => + None + } + } +} diff --git a/paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala b/paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala new file mode 100644 index 0000000000000..6ab8a2671b518 --- /dev/null +++ b/paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala @@ -0,0 +1,21 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.spark.sql + +class PaimonViewTest extends PaimonViewTestBase {} diff --git a/paimon-spark/paimon-spark-3.4/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala b/paimon-spark/paimon-spark-3.4/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala new file mode 100644 index 0000000000000..6ab8a2671b518 --- /dev/null +++ b/paimon-spark/paimon-spark-3.4/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala @@ -0,0 +1,21 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.sql + +class PaimonViewTest extends PaimonViewTestBase {} diff --git a/paimon-spark/paimon-spark-3.5/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala b/paimon-spark/paimon-spark-3.5/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala new file mode 100644 index 0000000000000..6ab8a2671b518 --- /dev/null +++ b/paimon-spark/paimon-spark-3.5/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala @@ -0,0 +1,21 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.sql + +class PaimonViewTest extends PaimonViewTestBase {} diff --git a/paimon-spark/paimon-spark-4.0/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala b/paimon-spark/paimon-spark-4.0/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala new file mode 100644 index 0000000000000..6ab8a2671b518 --- /dev/null +++ b/paimon-spark/paimon-spark-4.0/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTest.scala @@ -0,0 +1,21 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. 
You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.sql + +class PaimonViewTest extends PaimonViewTestBase {} diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java index 89448c1f4310a..3b9af1694eef7 100644 --- a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java @@ -27,6 +27,7 @@ import org.apache.paimon.schema.SchemaChange; import org.apache.paimon.spark.catalog.SparkBaseCatalog; import org.apache.paimon.spark.catalog.SupportFunction; +import org.apache.paimon.spark.catalog.SupportView; import org.apache.paimon.table.FormatTable; import org.apache.paimon.table.FormatTableOptions; @@ -72,10 +73,12 @@ import static org.apache.paimon.spark.SparkCatalogOptions.DEFAULT_DATABASE; import static org.apache.paimon.spark.SparkTypeUtils.toPaimonType; import static org.apache.paimon.spark.util.OptionUtils.copyWithSQLConf; +import static org.apache.paimon.spark.utils.CatalogUtils.checkNamespace; +import static org.apache.paimon.spark.utils.CatalogUtils.toIdentifier; import static org.apache.paimon.utils.Preconditions.checkArgument; /** Spark {@link TableCatalog} for paimon. */ -public class SparkCatalog extends SparkBaseCatalog implements SupportFunction { +public class SparkCatalog extends SparkBaseCatalog implements SupportFunction, SupportView { private static final Logger LOG = LoggerFactory.getLogger(SparkCatalog.class); @@ -126,10 +129,7 @@ public String[] defaultNamespace() { @Override public void createNamespace(String[] namespace, Map metadata) throws NamespaceAlreadyExistsException { - checkArgument( - isValidateNamespace(namespace), - "Namespace %s is not valid", - Arrays.toString(namespace)); + checkNamespace(namespace); try { catalog.createDatabase(namespace[0], false, metadata); } catch (Catalog.DatabaseAlreadyExistException e) { @@ -152,9 +152,7 @@ public String[][] listNamespaces(String[] namespace) throws NoSuchNamespaceExcep if (namespace.length == 0) { return listNamespaces(); } - if (!isValidateNamespace(namespace)) { - throw new NoSuchNamespaceException(namespace); - } + checkNamespace(namespace); try { catalog.getDatabase(namespace[0]); return new String[0][]; @@ -166,10 +164,7 @@ public String[][] listNamespaces(String[] namespace) throws NoSuchNamespaceExcep @Override public Map loadNamespaceMetadata(String[] namespace) throws NoSuchNamespaceException { - checkArgument( - isValidateNamespace(namespace), - "Namespace %s is not valid", - Arrays.toString(namespace)); + checkNamespace(namespace); String dataBaseName = namespace[0]; try { return catalog.getDatabase(dataBaseName).options(); @@ -207,10 +202,7 @@ public boolean dropNamespace(String[] namespace) throws NoSuchNamespaceException */ public boolean dropNamespace(String[] namespace, boolean cascade) throws NoSuchNamespaceException { - checkArgument( - isValidateNamespace(namespace), - "Namespace %s is not valid", - Arrays.toString(namespace)); + 
checkNamespace(namespace); try { catalog.dropDatabase(namespace[0], false, cascade); return true; @@ -224,10 +216,7 @@ public boolean dropNamespace(String[] namespace, boolean cascade) @Override public Identifier[] listTables(String[] namespace) throws NoSuchNamespaceException { - checkArgument( - isValidateNamespace(namespace), - "Missing database in namespace: %s", - Arrays.toString(namespace)); + checkNamespace(namespace); try { return catalog.listTables(namespace[0]).stream() .map(table -> Identifier.of(namespace, table)) @@ -239,10 +228,7 @@ public Identifier[] listTables(String[] namespace) throws NoSuchNamespaceExcepti @Override public void invalidateTable(Identifier ident) { - try { - catalog.invalidateTable(toIdentifier(ident)); - } catch (NoSuchTableException ignored) { - } + catalog.invalidateTable(toIdentifier(ident)); } @Override @@ -347,7 +333,7 @@ public boolean dropTable(Identifier ident) { try { catalog.dropTable(toIdentifier(ident), false); return true; - } catch (Catalog.TableNotExistException | NoSuchTableException e) { + } catch (Catalog.TableNotExistException e) { return false; } } @@ -454,10 +440,6 @@ private void validateAlterProperty(String alterKey) { } } - private boolean isValidateNamespace(String[] namespace) { - return namespace.length == 1; - } - @Override public void renameTable(Identifier oldIdent, Identifier newIdent) throws NoSuchTableException, TableAlreadyExistsException { @@ -472,15 +454,6 @@ public void renameTable(Identifier oldIdent, Identifier newIdent) // --------------------- tools ------------------------------------------ - protected org.apache.paimon.catalog.Identifier toIdentifier(Identifier ident) - throws NoSuchTableException { - if (!isValidateNamespace(ident.namespace())) { - throw new NoSuchTableException(ident); - } - - return new org.apache.paimon.catalog.Identifier(ident.namespace()[0], ident.name()); - } - protected org.apache.spark.sql.connector.catalog.Table loadSparkTable( Identifier ident, Map extraOptions) throws NoSuchTableException { try { diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkTypeUtils.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkTypeUtils.java index 8bba676200ce7..f6643f7584065 100644 --- a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkTypeUtils.java +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkTypeUtils.java @@ -81,6 +81,10 @@ public static DataType fromPaimonType(org.apache.paimon.types.DataType type) { return type.accept(PaimonToSparkTypeVisitor.INSTANCE); } + public static org.apache.paimon.types.RowType toPaimonRowType(StructType type) { + return (RowType) toPaimonType(type); + } + public static org.apache.paimon.types.DataType toPaimonType(DataType dataType) { return SparkToPaimonTypeVisitor.visit(dataType); } diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/catalog/SupportView.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/catalog/SupportView.java new file mode 100644 index 0000000000000..b8ce86e892866 --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/catalog/SupportView.java @@ -0,0 +1,86 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. 
The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.catalog; + +import org.apache.paimon.catalog.Catalog; +import org.apache.paimon.spark.SparkTypeUtils; +import org.apache.paimon.view.View; +import org.apache.paimon.view.ViewImpl; + +import org.apache.spark.sql.catalyst.analysis.NoSuchNamespaceException; +import org.apache.spark.sql.connector.catalog.Identifier; +import org.apache.spark.sql.types.StructType; + +import java.util.List; +import java.util.Map; + +import static org.apache.paimon.spark.utils.CatalogUtils.checkNamespace; +import static org.apache.paimon.spark.utils.CatalogUtils.toIdentifier; + +/** Catalog methods for working with Views. */ +public interface SupportView extends WithPaimonCatalog { + + default List listViews(String[] namespace) throws NoSuchNamespaceException { + try { + checkNamespace(namespace); + return paimonCatalog().listViews(namespace[0]); + } catch (Catalog.DatabaseNotExistException e) { + throw new NoSuchNamespaceException(namespace); + } + } + + default View loadView(Identifier ident) throws Catalog.ViewNotExistException { + return paimonCatalog().getView(toIdentifier(ident)); + } + + default void createView( + Identifier ident, + StructType schema, + String queryText, + String comment, + Map properties, + Boolean ignoreIfExists) + throws NoSuchNamespaceException { + org.apache.paimon.catalog.Identifier paimonIdent = toIdentifier(ident); + try { + paimonCatalog() + .createView( + paimonIdent, + new ViewImpl( + paimonIdent, + SparkTypeUtils.toPaimonRowType(schema), + queryText, + comment, + properties), + ignoreIfExists); + } catch (Catalog.ViewAlreadyExistException e) { + throw new RuntimeException("view already exists: " + ident, e); + } catch (Catalog.DatabaseNotExistException e) { + throw new NoSuchNamespaceException(ident.namespace()); + } + } + + default void dropView(Identifier ident, Boolean ignoreIfExists) { + try { + paimonCatalog().dropView(toIdentifier(ident), ignoreIfExists); + } catch (Catalog.ViewNotExistException e) { + throw new RuntimeException("view not exists: " + ident, e); + } + } +} diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/utils/CatalogUtils.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/utils/CatalogUtils.java new file mode 100644 index 0000000000000..fca9df210e708 --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/utils/CatalogUtils.java @@ -0,0 +1,41 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. 
You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.utils; + +import org.apache.spark.sql.connector.catalog.Identifier; + +import java.util.Arrays; + +import static org.apache.paimon.utils.Preconditions.checkArgument; + +/** Utils of catalog. */ +public class CatalogUtils { + + public static void checkNamespace(String[] namespace) { + checkArgument( + namespace.length == 1, + "Paimon only support single namespace, but got %s", + Arrays.toString(namespace)); + } + + public static org.apache.paimon.catalog.Identifier toIdentifier(Identifier ident) { + checkNamespace(ident.namespace()); + return new org.apache.paimon.catalog.Identifier(ident.namespace()[0], ident.name()); + } +} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/PaimonViewResolver.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/PaimonViewResolver.scala new file mode 100644 index 0000000000000..a375a296583ec --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/PaimonViewResolver.scala @@ -0,0 +1,85 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.spark.catalyst.analysis + +import org.apache.paimon.catalog.Catalog.ViewNotExistException +import org.apache.paimon.spark.SparkTypeUtils +import org.apache.paimon.spark.catalog.SupportView +import org.apache.paimon.view.View + +import org.apache.spark.sql.SparkSession +import org.apache.spark.sql.catalyst.analysis.{GetColumnByOrdinal, UnresolvedRelation} +import org.apache.spark.sql.catalyst.expressions.{Alias, UpCast} +import org.apache.spark.sql.catalyst.parser.ParseException +import org.apache.spark.sql.catalyst.parser.extensions.{CurrentOrigin, Origin} +import org.apache.spark.sql.catalyst.plans.logical.{LogicalPlan, Project, SubqueryAlias} +import org.apache.spark.sql.catalyst.rules.Rule +import org.apache.spark.sql.connector.catalog.PaimonLookupCatalog + +case class PaimonViewResolver(spark: SparkSession) + extends Rule[LogicalPlan] + with PaimonLookupCatalog { + + protected lazy val catalogManager = spark.sessionState.catalogManager + + override def apply(plan: LogicalPlan): LogicalPlan = plan.resolveOperators { + case u @ UnresolvedRelation(parts @ CatalogAndIdentifier(catalog: SupportView, ident), _, _) => + try { + val view = catalog.loadView(ident) + createViewRelation(parts, view) + } catch { + case _: ViewNotExistException => + u + } + } + + private def createViewRelation(nameParts: Seq[String], view: View): LogicalPlan = { + val parsedPlan = parseViewText(nameParts.toArray.mkString("."), view.query) + + val aliases = SparkTypeUtils.fromPaimonRowType(view.rowType()).fields.zipWithIndex.map { + case (expected, pos) => + val attr = GetColumnByOrdinal(pos, expected.dataType) + Alias(UpCast(attr, expected.dataType), expected.name)(explicitMetadata = + Some(expected.metadata)) + } + + SubqueryAlias(nameParts, Project(aliases, parsedPlan)) + } + + private def parseViewText(name: String, viewText: String): LogicalPlan = { + val origin = Origin( + objectType = Some("VIEW"), + objectName = Some(name) + ) + try { + CurrentOrigin.withOrigin(origin) { + try { + spark.sessionState.sqlParser.parseQuery(viewText) + } catch { + // For compatibility with Spark 3.2 and below + case _: NoSuchMethodError => + spark.sessionState.sqlParser.parsePlan(viewText) + } + } + } catch { + case _: ParseException => + throw new RuntimeException("Failed to parse view text: " + viewText) + } + } +} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/plans/logical/PaimonViewCommand.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/plans/logical/PaimonViewCommand.scala new file mode 100644 index 0000000000000..24b27bb0e6cca --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/plans/logical/PaimonViewCommand.scala @@ -0,0 +1,74 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+ * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.catalyst.plans.logical + +import org.apache.paimon.spark.leafnode.{PaimonBinaryCommand, PaimonUnaryCommand} + +import org.apache.spark.sql.catalyst.expressions.Attribute +import org.apache.spark.sql.catalyst.plans.logical.{LeafNode, LogicalPlan, ShowViews, Statistics} +import org.apache.spark.sql.connector.catalog.{CatalogPlugin, Identifier} + +case class CreatePaimonView( + child: LogicalPlan, + queryText: String, + query: LogicalPlan, + columnAliases: Seq[String], + columnComments: Seq[Option[String]], + queryColumnNames: Seq[String] = Seq.empty, + comment: Option[String], + properties: Map[String, String], + allowExisting: Boolean, + replace: Boolean) + extends PaimonBinaryCommand { + + override def left: LogicalPlan = child + + override def right: LogicalPlan = query + + override protected def withNewChildrenInternal( + newLeft: LogicalPlan, + newRight: LogicalPlan): LogicalPlan = + copy(child = newLeft, query = newRight) +} + +case class DropPaimonView(child: LogicalPlan, ifExists: Boolean) extends PaimonUnaryCommand { + + override protected def withNewChildInternal(newChild: LogicalPlan): DropPaimonView = + copy(child = newChild) +} + +case class ShowPaimonViews( + namespace: LogicalPlan, + pattern: Option[String], + override val output: Seq[Attribute] = ShowViews.getOutputAttrs) + extends PaimonUnaryCommand { + + override def child: LogicalPlan = namespace + + override protected def withNewChildInternal(newChild: LogicalPlan): ShowPaimonViews = + copy(namespace = newChild) +} + +/** Copy from spark 3.4+ */ +case class ResolvedIdentifier(catalog: CatalogPlugin, identifier: Identifier) extends LeafNode { + + override def output: Seq[Attribute] = Nil + + override def stats: Statistics = Statistics.DUMMY +} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/execution/PaimonStrategy.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/execution/PaimonStrategy.scala index 0c3d3e6b6dc64..0c3865f7d979a 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/execution/PaimonStrategy.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/execution/PaimonStrategy.scala @@ -19,10 +19,12 @@ package org.apache.paimon.spark.execution import org.apache.paimon.spark.{SparkCatalog, SparkUtils} -import org.apache.paimon.spark.catalyst.plans.logical.{CreateOrReplaceTagCommand, DeleteTagCommand, PaimonCallCommand, RenameTagCommand, ShowTagsCommand} +import org.apache.paimon.spark.catalog.SupportView +import org.apache.paimon.spark.catalyst.plans.logical.{CreateOrReplaceTagCommand, CreatePaimonView, DeleteTagCommand, DropPaimonView, PaimonCallCommand, RenameTagCommand, ResolvedIdentifier, ShowPaimonViews, ShowTagsCommand} import org.apache.spark.sql.{SparkSession, Strategy} import org.apache.spark.sql.catalyst.InternalRow +import org.apache.spark.sql.catalyst.analysis.ResolvedNamespace import org.apache.spark.sql.catalyst.expressions.{Expression, GenericInternalRow, PredicateHelper} import org.apache.spark.sql.catalyst.plans.logical.{CreateTableAsSelect, LogicalPlan} import org.apache.spark.sql.connector.catalog.{Identifier, PaimonLookupCatalog, TableCatalog} @@ -65,6 +67,39 @@ case class PaimonStrategy(spark: SparkSession) case RenameTagCommand(PaimonCatalogAndIdentifier(catalog, ident), sourceTag, targetTag) => RenameTagExec(catalog, ident, 
sourceTag, targetTag) :: Nil + case CreatePaimonView( + ResolvedIdentifier(viewCatalog: SupportView, ident), + queryText, + query, + columnAliases, + columnComments, + queryColumnNames, + comment, + properties, + allowExisting, + replace) => + CreatePaimonViewExec( + viewCatalog, + ident, + queryText, + query.schema, + columnAliases, + columnComments, + queryColumnNames, + comment, + properties, + allowExisting, + replace) :: Nil + + case DropPaimonView(ResolvedIdentifier(viewCatalog: SupportView, ident), ifExists) => + DropPaimonViewExec(viewCatalog, ident, ifExists) :: Nil + + // A new member was added to ResolvedNamespace since spark4.0, + // unapply pattern matching is not used here to ensure compatibility across multiple spark versions. + case ShowPaimonViews(r: ResolvedNamespace, pattern, output) + if r.catalog.isInstanceOf[SupportView] => + ShowPaimonViewsExec(output, r.catalog.asInstanceOf[SupportView], r.namespace, pattern) :: Nil + case _ => Nil } diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/execution/PaimonViewExec.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/execution/PaimonViewExec.scala new file mode 100644 index 0000000000000..7a4b907c72f12 --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/execution/PaimonViewExec.scala @@ -0,0 +1,117 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.spark.execution + +import org.apache.paimon.spark.catalog.SupportView +import org.apache.paimon.spark.leafnode.PaimonLeafV2CommandExec + +import org.apache.spark.sql.catalyst.InternalRow +import org.apache.spark.sql.catalyst.expressions.{Attribute, GenericInternalRow} +import org.apache.spark.sql.catalyst.util.StringUtils +import org.apache.spark.sql.connector.catalog.Identifier +import org.apache.spark.sql.types.StructType +import org.apache.spark.unsafe.types.UTF8String + +import scala.collection.JavaConverters._ +import scala.collection.mutable.ArrayBuffer + +case class CreatePaimonViewExec( + catalog: SupportView, + ident: Identifier, + queryText: String, + viewSchema: StructType, + columnAliases: Seq[String], + columnComments: Seq[Option[String]], + queryColumnNames: Seq[String], + comment: Option[String], + properties: Map[String, String], + allowExisting: Boolean, + replace: Boolean +) extends PaimonLeafV2CommandExec { + + override def output: Seq[Attribute] = Nil + + override protected def run(): Seq[InternalRow] = { + if (columnAliases.nonEmpty || columnComments.nonEmpty || queryColumnNames.nonEmpty) { + throw new UnsupportedOperationException( + "columnAliases, columnComments and queryColumnNames are not supported now") + } + + // Note: for replace just drop then create ,this operation is non-atomic. + if (replace) { + catalog.dropView(ident, true) + } + + catalog.createView( + ident, + viewSchema, + queryText, + comment.orNull, + properties.asJava, + allowExisting) + + Nil + } + + override def simpleString(maxFields: Int): String = { + s"CreatePaimonViewExec: $ident" + } +} + +case class DropPaimonViewExec(catalog: SupportView, ident: Identifier, ifExists: Boolean) + extends PaimonLeafV2CommandExec { + + override lazy val output: Seq[Attribute] = Nil + + override protected def run(): Seq[InternalRow] = { + catalog.dropView(ident, ifExists) + Nil + } + + override def simpleString(maxFields: Int): String = { + s"DropPaimonViewExec: $ident" + } +} + +case class ShowPaimonViewsExec( + output: Seq[Attribute], + catalog: SupportView, + namespace: Seq[String], + pattern: Option[String]) + extends PaimonLeafV2CommandExec { + + override protected def run(): Seq[InternalRow] = { + val rows = new ArrayBuffer[InternalRow]() + catalog.listViews(namespace.toArray).asScala.map { + viewName => + if (pattern.forall(StringUtils.filterPattern(Seq(viewName), _).nonEmpty)) { + rows += new GenericInternalRow( + Array( + UTF8String.fromString(namespace.mkString(".")), + UTF8String.fromString(viewName), + false)) + } + } + rows.toSeq + } + + override def simpleString(maxFields: Int): String = { + s"ShowPaimonViewsExec: $namespace" + } +} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala index 4fe217ee09bd8..6f47a77ef3080 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala @@ -18,7 +18,7 @@ package org.apache.paimon.spark.extensions -import org.apache.paimon.spark.catalyst.analysis.{PaimonAnalysis, PaimonDeleteTable, PaimonIncompatiblePHRRules, PaimonIncompatibleResolutionRules, PaimonMergeInto, PaimonPostHocResolutionRules, PaimonProcedureResolver, PaimonUpdateTable} 
+import org.apache.paimon.spark.catalyst.analysis.{PaimonAnalysis, PaimonDeleteTable, PaimonIncompatiblePHRRules, PaimonIncompatibleResolutionRules, PaimonMergeInto, PaimonPostHocResolutionRules, PaimonProcedureResolver, PaimonUpdateTable, PaimonViewResolver} import org.apache.paimon.spark.catalyst.optimizer.{EvalSubqueriesForDeleteTable, MergePaimonScalarSubqueries} import org.apache.paimon.spark.catalyst.plans.logical.PaimonTableValuedFunctions import org.apache.paimon.spark.execution.PaimonStrategy @@ -37,6 +37,7 @@ class PaimonSparkSessionExtensions extends (SparkSessionExtensions => Unit) { // analyzer extensions extensions.injectResolutionRule(spark => new PaimonAnalysis(spark)) extensions.injectResolutionRule(spark => PaimonProcedureResolver(spark)) + extensions.injectResolutionRule(spark => PaimonViewResolver(spark)) extensions.injectResolutionRule(spark => PaimonIncompatibleResolutionRules(spark)) extensions.injectPostHocResolutionRule(spark => PaimonPostHocResolutionRules(spark)) diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/leafnode/package.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/leafnode/package.scala index 5befb88dae43f..6ebab038480a4 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/leafnode/package.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/leafnode/package.scala @@ -18,7 +18,7 @@ package org.apache.paimon.spark -import org.apache.spark.sql.catalyst.plans.logical.{LeafCommand, LeafParsedStatement} +import org.apache.spark.sql.catalyst.plans.logical.{BinaryCommand, LeafCommand, LeafParsedStatement, UnaryCommand} import org.apache.spark.sql.execution.command.LeafRunnableCommand import org.apache.spark.sql.execution.datasources.v2.LeafV2CommandExec @@ -30,6 +30,9 @@ package object leafnode { trait PaimonLeafCommand extends LeafCommand - trait PaimonLeafV2CommandExec extends LeafV2CommandExec + trait PaimonUnaryCommand extends UnaryCommand + + trait PaimonBinaryCommand extends BinaryCommand + trait PaimonLeafV2CommandExec extends LeafV2CommandExec } diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSparkSqlExtensionsParser.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSparkSqlExtensionsParser.scala index dd0a48159b2ae..9ece186930d71 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSparkSqlExtensionsParser.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSparkSqlExtensionsParser.scala @@ -23,7 +23,7 @@ import org.antlr.v4.runtime.atn.PredictionMode import org.antlr.v4.runtime.misc.{Interval, ParseCancellationException} import org.antlr.v4.runtime.tree.TerminalNodeImpl import org.apache.spark.internal.Logging -import org.apache.spark.sql.AnalysisException +import org.apache.spark.sql.{AnalysisException, SparkSession} import org.apache.spark.sql.catalyst.{FunctionIdentifier, TableIdentifier} import org.apache.spark.sql.catalyst.expressions.Expression import org.apache.spark.sql.catalyst.parser.{ParseException, ParserInterface} @@ -61,7 +61,7 @@ class PaimonSparkSqlExtensionsParser(val delegate: ParserInterface) parse(sqlTextAfterSubstitution)(parser => astBuilder.visit(parser.singleStatement())) .asInstanceOf[LogicalPlan] } else { - delegate.parsePlan(sqlText) + 
RewritePaimonViewCommands(SparkSession.active).apply(delegate.parsePlan(sqlText)) } } diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSqlExtensionsAstBuilder.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSqlExtensionsAstBuilder.scala index b864894e7498c..a1289a5f0b50f 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSqlExtensionsAstBuilder.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSqlExtensionsAstBuilder.scala @@ -19,7 +19,7 @@ package org.apache.spark.sql.catalyst.parser.extensions import org.apache.paimon.spark.catalyst.plans.logical -import org.apache.paimon.spark.catalyst.plans.logical.{CreateOrReplaceTagCommand, DeleteTagCommand, PaimonCallArgument, PaimonCallStatement, PaimonNamedArgument, PaimonPositionalArgument, RenameTagCommand, ShowTagsCommand, TagOptions} +import org.apache.paimon.spark.catalyst.plans.logical._ import org.apache.paimon.utils.TimeUtils import org.antlr.v4.runtime._ @@ -212,5 +212,16 @@ object CurrentOrigin { def get: Origin = value.get() def set(o: Origin): Unit = value.set(o) def reset(): Unit = value.set(Origin()) + + def withOrigin[A](o: Origin)(f: => A): A = { + // remember the previous one so it can be reset to this + // way withOrigin can be recursive + val previous = get + set(o) + val ret = + try f + finally { set(previous) } + ret + } } /* Apache Spark copy end */ diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala new file mode 100644 index 0000000000000..f69e5d92038ed --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/RewritePaimonViewCommands.scala @@ -0,0 +1,77 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.spark.sql.catalyst.parser.extensions + +import org.apache.paimon.spark.catalog.SupportView +import org.apache.paimon.spark.catalyst.plans.logical.{CreatePaimonView, DropPaimonView, ResolvedIdentifier, ShowPaimonViews} + +import org.apache.spark.sql.SparkSession +import org.apache.spark.sql.catalyst.analysis.{CTESubstitution, ResolvedNamespace, UnresolvedIdentifier} +import org.apache.spark.sql.catalyst.plans.logical._ +import org.apache.spark.sql.catalyst.rules.Rule +import org.apache.spark.sql.connector.catalog.{CatalogManager, LookupCatalog} + +case class RewritePaimonViewCommands(spark: SparkSession) + extends Rule[LogicalPlan] + with LookupCatalog { + + protected lazy val catalogManager: CatalogManager = spark.sessionState.catalogManager + + override def apply(plan: LogicalPlan): LogicalPlan = plan.resolveOperatorsUp { + + // A new member was added to CreatePaimonView since spark4.0, + // unapply pattern matching is not used here to ensure compatibility across multiple spark versions. + case c: CreateView => + ResolvedIdent + .unapply(c.child) + .map { + resolved => + CreatePaimonView( + child = resolved, + queryText = c.originalText.get, + query = CTESubstitution.apply(c.query), + columnAliases = c.userSpecifiedColumns.map(_._1), + columnComments = c.userSpecifiedColumns.map(_._2.orElse(None)), + comment = c.comment, + properties = c.properties, + allowExisting = c.allowExisting, + replace = c.replace + ) + } + .getOrElse(c) + + case DropView(ResolvedIdent(resolved), ifExists: Boolean) => + DropPaimonView(resolved, ifExists) + + case ShowViews(_, pattern, output) if catalogManager.currentCatalog.isInstanceOf[SupportView] => + ShowPaimonViews( + ResolvedNamespace(catalogManager.currentCatalog, catalogManager.currentNamespace), + pattern, + output) + } + + private object ResolvedIdent { + def unapply(unresolved: Any): Option[ResolvedIdentifier] = unresolved match { + case UnresolvedIdentifier(CatalogAndIdentifier(viewCatalog: SupportView, ident), _) => + Some(ResolvedIdentifier(viewCatalog, ident)) + case _ => + None + } + } +} diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala b/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala index 33b993160dfd7..56922ae2aeff8 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala +++ b/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala @@ -241,12 +241,12 @@ abstract class DDLWithHiveCatalogTestBase extends PaimonHiveTestBase { spark.sql(s"CREATE DATABASE paimon_db") spark.sql(s"USE paimon_db") spark.sql(s"CREATE TABLE paimon_tbl (id int, name string, dt string) using paimon") - // Currently, only spark_catalog supports create other table or view + // Only spark_catalog supports create other table if (catalogName.equals(sparkCatalogName)) { spark.sql(s"CREATE TABLE parquet_tbl (id int, name string, dt string) using parquet") spark.sql(s"CREATE VIEW parquet_tbl_view AS SELECT * FROM parquet_tbl") - spark.sql(s"CREATE VIEW paimon_tbl_view AS SELECT * FROM paimon_tbl") } + spark.sql(s"CREATE VIEW paimon_tbl_view AS SELECT * FROM paimon_tbl") spark.sql(s"USE default") spark.sql(s"DROP DATABASE paimon_db CASCADE") } diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTestBase.scala 
b/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTestBase.scala new file mode 100644 index 0000000000000..39ed8e8a769d3 --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTestBase.scala @@ -0,0 +1,96 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.sql + +import org.apache.paimon.spark.PaimonHiveTestBase + +import org.apache.spark.sql.Row + +abstract class PaimonViewTestBase extends PaimonHiveTestBase { + + test("Paimon View: create and drop view") { + Seq(sparkCatalogName, paimonHiveCatalogName).foreach { + catalogName => + { + sql(s"USE $catalogName") + withDatabase("test_db") { + sql("CREATE DATABASE test_db") + sql("USE test_db") + withTable("t") { + withView("v1") { + sql("CREATE TABLE t (id INT) USING paimon") + sql("INSERT INTO t VALUES (1), (2)") + + sql("CREATE VIEW v1 AS SELECT * FROM t") + checkAnswer(sql("SHOW VIEWS"), Seq(Row("test_db", "v1", false))) + checkAnswer(sql("SELECT * FROM v1"), Seq(Row(1), Row(2))) + checkAnswer( + sql("SELECT * FROM v1 WHERE id >= (SELECT max(id) FROM v1)"), + Seq(Row(2))) + + // test drop view + sql("DROP VIEW IF EXISTS v1") + checkAnswer(sql("SHOW VIEWS"), Seq()) + sql("CREATE VIEW v1 AS SELECT * FROM t WHERE id > 1") + checkAnswer(sql("SHOW VIEWS"), Seq(Row("test_db", "v1", false))) + checkAnswer(sql("SELECT * FROM v1"), Seq(Row(2))) + + // test create or replace view + intercept[Exception] { + sql("CREATE VIEW v1 AS SELECT * FROM t WHERE id < 2") + } + sql("CREATE OR REPLACE VIEW v1 AS SELECT * FROM t WHERE id < 2") + checkAnswer(sql("SELECT * FROM v1"), Seq(Row(1))) + } + } + } + } + } + } + + test("Paimon View: show views") { + Seq(sparkCatalogName, paimonHiveCatalogName).foreach { + catalogName => + { + sql(s"USE $catalogName") + withDatabase("test_db") { + sql("CREATE DATABASE test_db") + sql("USE test_db") + withTable("t") { + withView("va", "vab", "vc") { + sql("CREATE TABLE t (id INT) USING paimon") + sql("CREATE VIEW va AS SELECT * FROM t") + sql("CREATE VIEW vab AS SELECT * FROM t") + sql("CREATE VIEW vc AS SELECT * FROM t") + checkAnswer( + sql("SHOW VIEWS"), + Seq( + Row("test_db", "va", false), + Row("test_db", "vab", false), + Row("test_db", "vc", false))) + checkAnswer( + sql("SHOW VIEWS LIKE 'va*'"), + Seq(Row("test_db", "va", false), Row("test_db", "vab", false))) + } + } + } + } + } + } +} From f09d9c200a6f2d1913e7f1f318b164205d226ac0 Mon Sep 17 00:00:00 2001 From: Jingsong Date: Tue, 19 Nov 2024 11:20:56 +0800 Subject: [PATCH 029/157] [doc] Move system tables to concepts --- docs/content/concepts/spec/_index.md | 2 +- .../system-tables.md | 87 ++++++++++--------- docs/content/concepts/table-types.md | 33 ++++++- docs/content/flink/savepoint.md 
| 2 +- .../primary-key-table/query-performance.md | 2 +- docs/content/primary-key-table/table-mode.md | 2 +- 6 files changed, 81 insertions(+), 47 deletions(-) rename docs/content/{maintenance => concepts}/system-tables.md (97%) diff --git a/docs/content/concepts/spec/_index.md b/docs/content/concepts/spec/_index.md index 166ce4eeaa549..ef5f03098e20d 100644 --- a/docs/content/concepts/spec/_index.md +++ b/docs/content/concepts/spec/_index.md @@ -1,7 +1,7 @@ --- title: Specification bookCollapseSection: true -weight: 6 +weight: 7 --- + + commons-codec + commons-codec + 1.9 + test + + org.apache.paimon paimon-common diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/flink/streaming/runtime/streamrecord/RecordAttributes.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/flink/streaming/runtime/streamrecord/RecordAttributes.java deleted file mode 100644 index 723c71dc565d7..0000000000000 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/flink/streaming/runtime/streamrecord/RecordAttributes.java +++ /dev/null @@ -1,22 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.flink.streaming.runtime.streamrecord; - -/** Placeholder class for new feature introduced since flink 1.19. Should never be used. */ -public class RecordAttributes extends StreamElement {} diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/flink/table/catalog/CatalogMaterializedTable.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/flink/table/catalog/CatalogMaterializedTable.java deleted file mode 100644 index 6eabd1db7f382..0000000000000 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/flink/table/catalog/CatalogMaterializedTable.java +++ /dev/null @@ -1,34 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.flink.table.catalog; - -/** - * Dummy placeholder to resolve compatibility issue of CatalogMaterializedTable(introduced in flink - * 1.20). 
- */ -public interface CatalogMaterializedTable extends CatalogBaseTable { - /** Dummy LogicalRefreshMode placeholder. */ - enum LogicalRefreshMode {} - - /** Dummy RefreshMode placeholder. */ - enum RefreshMode {} - - /** Dummy RefreshStatus placeholder. */ - enum RefreshStatus {} -} From 253378850431ca97687847199e900d908e04e6df Mon Sep 17 00:00:00 2001 From: Kerwin <37063904+zhuangchong@users.noreply.github.com> Date: Mon, 25 Nov 2024 13:31:25 +0800 Subject: [PATCH 055/157] [hive] Improve paimon format table conversion hive table in hive catalog. (#4522) --- .../org/apache/paimon/table/FormatTable.java | 14 ++ .../org/apache/paimon/hive/HiveCatalog.java | 124 +++++++++--------- .../apache/paimon/hive/HiveCatalogTest.java | 4 +- 3 files changed, 76 insertions(+), 66 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/table/FormatTable.java b/paimon-core/src/main/java/org/apache/paimon/table/FormatTable.java index a53ba545c25e4..a4c7788c38afe 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/FormatTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/FormatTable.java @@ -34,6 +34,7 @@ import javax.annotation.Nullable; import java.time.Duration; +import java.util.Arrays; import java.util.Collections; import java.util.HashMap; import java.util.List; @@ -70,6 +71,19 @@ enum Format { CSV } + /** Parses a file format string to a corresponding {@link Format} enum constant. */ + static Format parseFormat(String fileFormat) { + try { + return Format.valueOf(fileFormat.toUpperCase()); + } catch (IllegalArgumentException e) { + throw new UnsupportedOperationException( + "Format table unsupported file format: " + + fileFormat + + ". Supported formats: " + + Arrays.toString(Format.values())); + } + } + /** Create a new builder for {@link FormatTable}. */ static FormatTable.Builder builder() { return new FormatTable.Builder(); diff --git a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java index ebd5a1edf89b2..0ecc78469e154 100644 --- a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java +++ b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java @@ -112,7 +112,6 @@ import static org.apache.paimon.utils.BranchManager.DEFAULT_MAIN_BRANCH; import static org.apache.paimon.utils.HadoopUtils.addHadoopConfIfFound; import static org.apache.paimon.utils.Preconditions.checkArgument; -import static org.apache.paimon.utils.Preconditions.checkNotNull; import static org.apache.paimon.utils.StringUtils.isNullOrWhitespaceOnly; /** A catalog implementation for Hive. 
*/ @@ -122,7 +121,7 @@ public class HiveCatalog extends AbstractCatalog { // Reserved properties public static final String TABLE_TYPE_PROP = "table_type"; - public static final String PAIMON_TABLE_TYPE_VALUE = "paimon"; + public static final String PAIMON_TABLE_IDENTIFIER = "PAIMON"; // we don't include paimon-hive-connector as dependencies because it depends on // hive-exec @@ -766,33 +765,24 @@ private Table createHiveTable( } } - Table table = - newHmsTable(identifier, tblProperties, PAIMON_TABLE_TYPE_VALUE, externalTable); - updateHmsTable(table, identifier, tableSchema, PAIMON_TABLE_TYPE_VALUE, location); + Table table = newHmsTable(identifier, tblProperties, null, externalTable); + updateHmsTable(table, identifier, tableSchema, null, location); return table; } private Table createHiveFormatTable( Identifier identifier, TableSchema tableSchema, Path location, boolean externalTable) { - Options options = Options.fromMap(tableSchema.options()); - checkArgument(options.get(TYPE) == FORMAT_TABLE); + CoreOptions coreOptions = new CoreOptions(tableSchema.options()); + checkArgument(coreOptions.type() == FORMAT_TABLE); - String provider = tableSchema.options().get(FILE_FORMAT.key()); - checkNotNull(provider, FILE_FORMAT.key() + " should be configured."); - // valid supported format - FormatTable.Format.valueOf(provider.toUpperCase()); + // file.format option has a default value and cannot be empty. + FormatTable.Format provider = FormatTable.parseFormat(coreOptions.formatType()); Map tblProperties = new HashMap<>(); Table table = newHmsTable(identifier, tblProperties, provider, externalTable); updateHmsTable(table, identifier, tableSchema, provider, location); - if (FormatTable.Format.CSV.toString().equalsIgnoreCase(provider)) { - table.getSd() - .getSerdeInfo() - .getParameters() - .put(FIELD_DELIM, options.get(FIELD_DELIMITER)); - } return table; } @@ -879,7 +869,8 @@ private void alterTableToHms(Table table, Identifier identifier, TableSchema new throws TException, InterruptedException { updateHmsTablePars(table, newSchema); Path location = getTableLocation(identifier, table); - updateHmsTable(table, identifier, newSchema, newSchema.options().get("provider"), location); + // file format is null, because only data table support alter table. + updateHmsTable(table, identifier, newSchema, null, location); clients.execute(client -> HiveAlterTableUtils.alterTable(client, identifier, table)); } @@ -1059,12 +1050,9 @@ private boolean isExternalTable(Table table) { private Table newHmsTable( Identifier identifier, Map tableParameters, - String provider, + @Nullable FormatTable.Format provider, boolean externalTable) { long currentTimeMillis = System.currentTimeMillis(); - if (provider == null) { - provider = PAIMON_TABLE_TYPE_VALUE; - } Table table = new Table( identifier.getTableName(), @@ -1082,67 +1070,83 @@ private Table newHmsTable( externalTable ? 
TableType.EXTERNAL_TABLE.name() : TableType.MANAGED_TABLE.name()); - table.getParameters().put(TABLE_TYPE_PROP, provider.toUpperCase()); - if (PAIMON_TABLE_TYPE_VALUE.equalsIgnoreCase(provider)) { + + if (provider == null) { + // normal paimon table + table.getParameters().put(TABLE_TYPE_PROP, PAIMON_TABLE_IDENTIFIER); table.getParameters() .put(hive_metastoreConstants.META_TABLE_STORAGE, STORAGE_HANDLER_CLASS_NAME); } else { - table.getParameters().put(FILE_FORMAT.key(), provider.toLowerCase()); + // format table + table.getParameters().put(TABLE_TYPE_PROP, provider.name()); + table.getParameters().put(FILE_FORMAT.key(), provider.name().toLowerCase()); table.getParameters().put(TYPE.key(), FORMAT_TABLE.toString()); } + if (externalTable) { table.getParameters().put(HIVE_EXTERNAL_TABLE_PROP, "TRUE"); } return table; } - private String getSerdeClassName(String provider) { - if (provider == null || provider.equalsIgnoreCase(PAIMON_TABLE_TYPE_VALUE)) { - return SERDE_CLASS_NAME; - } else if (provider.equalsIgnoreCase("csv")) { - return "org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"; - } else if (provider.equalsIgnoreCase("parquet")) { - return "org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe"; - } else if (provider.equalsIgnoreCase("orc")) { - return "org.apache.hadoop.hive.ql.io.orc.OrcSerde"; - } else { + private String getSerdeClassName(@Nullable FormatTable.Format provider) { + if (provider == null) { return SERDE_CLASS_NAME; } + switch (provider) { + case CSV: + return "org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe"; + case PARQUET: + return "org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe"; + case ORC: + return "org.apache.hadoop.hive.ql.io.orc.OrcSerde"; + } + return SERDE_CLASS_NAME; } - private String getInputFormatName(String provider) { - if (provider == null || provider.equalsIgnoreCase(PAIMON_TABLE_TYPE_VALUE)) { - return INPUT_FORMAT_CLASS_NAME; - } else if (provider.equalsIgnoreCase("csv")) { - return "org.apache.hadoop.mapred.TextInputFormat"; - } else if (provider.equalsIgnoreCase("parquet")) { - return "org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat"; - } else if (provider.equalsIgnoreCase("orc")) { - return "org.apache.hadoop.hive.ql.io.orc.OrcInputFormat"; - } else { + private String getInputFormatName(@Nullable FormatTable.Format provider) { + if (provider == null) { return INPUT_FORMAT_CLASS_NAME; } + switch (provider) { + case CSV: + return "org.apache.hadoop.mapred.TextInputFormat"; + case PARQUET: + return "org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat"; + case ORC: + return "org.apache.hadoop.hive.ql.io.orc.OrcInputFormat"; + } + return INPUT_FORMAT_CLASS_NAME; } - private String getOutputFormatClassName(String provider) { - if (provider == null || provider.equalsIgnoreCase(PAIMON_TABLE_TYPE_VALUE)) { - return OUTPUT_FORMAT_CLASS_NAME; - } else if (provider.equalsIgnoreCase("csv")) { - return "org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat"; - } else if (provider.equalsIgnoreCase("parquet")) { - return "org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat"; - } else if (provider.equalsIgnoreCase("orc")) { - return "org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat"; - } else { + private String getOutputFormatClassName(@Nullable FormatTable.Format provider) { + if (provider == null) { return OUTPUT_FORMAT_CLASS_NAME; } + switch (provider) { + case CSV: + return "org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat"; + case PARQUET: + return 
"org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat"; + case ORC: + return "org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat"; + } + return OUTPUT_FORMAT_CLASS_NAME; + } + + private Map setSerDeInfoParam(@Nullable FormatTable.Format provider) { + Map param = new HashMap<>(); + if (provider == FormatTable.Format.CSV) { + param.put(FIELD_DELIM, options.get(FIELD_DELIMITER)); + } + return param; } private void updateHmsTable( Table table, Identifier identifier, TableSchema schema, - String provider, + @Nullable FormatTable.Format provider, Path location) { StorageDescriptor sd = table.getSd() != null ? table.getSd() : new StorageDescriptor(); @@ -1206,14 +1210,6 @@ private void updateHmsTable( locationHelper.specifyTableLocation(table, location.toString()); } - private Map setSerDeInfoParam(String provider) { - Map param = new HashMap<>(); - if (provider != null && provider.equalsIgnoreCase("csv")) { - param.put(FIELD_DELIM, options.get(FIELD_DELIMITER)); - } - return param; - } - private void updateHmsTablePars(Table table, TableSchema schema) { if (syncAllProperties()) { table.getParameters().putAll(schema.options()); diff --git a/paimon-hive/paimon-hive-catalog/src/test/java/org/apache/paimon/hive/HiveCatalogTest.java b/paimon-hive/paimon-hive-catalog/src/test/java/org/apache/paimon/hive/HiveCatalogTest.java index 3ba3f89e412fc..267bdf0c71002 100644 --- a/paimon-hive/paimon-hive-catalog/src/test/java/org/apache/paimon/hive/HiveCatalogTest.java +++ b/paimon-hive/paimon-hive-catalog/src/test/java/org/apache/paimon/hive/HiveCatalogTest.java @@ -55,7 +55,7 @@ import java.util.concurrent.atomic.AtomicBoolean; import static org.apache.hadoop.hive.conf.HiveConf.ConfVars.METASTORECONNECTURLKEY; -import static org.apache.paimon.hive.HiveCatalog.PAIMON_TABLE_TYPE_VALUE; +import static org.apache.paimon.hive.HiveCatalog.PAIMON_TABLE_IDENTIFIER; import static org.apache.paimon.hive.HiveCatalog.TABLE_TYPE_PROP; import static org.assertj.core.api.Assertions.assertThat; import static org.assertj.core.api.Assertions.assertThatThrownBy; @@ -218,7 +218,7 @@ public void testAddHiveTableParameters() { assertThat(tableProperties).containsEntry("comment", "this is a hive table"); assertThat(tableProperties) .containsEntry( - TABLE_TYPE_PROP, PAIMON_TABLE_TYPE_VALUE.toUpperCase(Locale.ROOT)); + TABLE_TYPE_PROP, PAIMON_TABLE_IDENTIFIER.toUpperCase(Locale.ROOT)); } catch (Exception e) { fail("Test failed due to exception: " + e.getMessage()); } From dc9849f87f098cddffa52889a95e29620ad3ecc3 Mon Sep 17 00:00:00 2001 From: Jingsong Date: Mon, 25 Nov 2024 14:25:41 +0800 Subject: [PATCH 056/157] [doc] Move Catalog API together with Java API --- docs/content/program-api/catalog-api.md | 2 +- docs/content/program-api/python-api.md | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/content/program-api/catalog-api.md b/docs/content/program-api/catalog-api.md index d016cfa7b2049..570577437d865 100644 --- a/docs/content/program-api/catalog-api.md +++ b/docs/content/program-api/catalog-api.md @@ -1,6 +1,6 @@ --- title: "Catalog API" -weight: 4 +weight: 3 type: docs aliases: - /api/catalog-api.html diff --git a/docs/content/program-api/python-api.md b/docs/content/program-api/python-api.md index 940e8cb52b4d3..ff457cc55f446 100644 --- a/docs/content/program-api/python-api.md +++ b/docs/content/program-api/python-api.md @@ -1,6 +1,6 @@ --- title: "Python API" -weight: 3 +weight: 4 type: docs aliases: - /api/python-api.html From d9a1b80a41169c41eb2628790d8bc4e7fc68467c Mon Sep 17 00:00:00 2001 
From: Jingsong Date: Mon, 25 Nov 2024 15:23:44 +0800 Subject: [PATCH 057/157] [doc] Document changelog producer to use lookup --- .../primary-key-table/changelog-producer.md | 25 +++++++++++-------- 1 file changed, 15 insertions(+), 10 deletions(-) diff --git a/docs/content/primary-key-table/changelog-producer.md b/docs/content/primary-key-table/changelog-producer.md index bf7a23fae2a54..011f7b6f27a7f 100644 --- a/docs/content/primary-key-table/changelog-producer.md +++ b/docs/content/primary-key-table/changelog-producer.md @@ -58,9 +58,11 @@ By specifying `'changelog-producer' = 'input'`, Paimon writers rely on their inp ## Lookup -If your input can’t produce a complete changelog but you still want to get rid of the costly normalized operator, you may consider using the `'lookup'` changelog producer. +If your input can’t produce a complete changelog but you still want to get rid of the costly normalized operator, you +may consider using the `'lookup'` changelog producer. -By specifying `'changelog-producer' = 'lookup'`, Paimon will generate changelog through `'lookup'` before committing the data writing. +By specifying `'changelog-producer' = 'lookup'`, Paimon will generate changelog through `'lookup'` before committing +the data writing (You can also enable [Async Compaction]({{< ref "primary-key-table/compaction#asynchronous-compaction" >}})). {{< img src="/img/changelog-producer-lookup.png">}} @@ -105,23 +107,26 @@ important for performance). ## Full Compaction -If you think the resource consumption of 'lookup' is too large, you can consider using 'full-compaction' changelog producer, -which can decouple data writing and changelog generation, and is more suitable for scenarios with high latency (For example, 10 minutes). +You can also consider using 'full-compaction' changelog producer to generate changelog, and is more suitable for scenarios +with large latency (For example, 30 minutes). -By specifying `'changelog-producer' = 'full-compaction'`, Paimon will compare the results between full compactions and produce the differences as changelog. The latency of changelog is affected by the frequency of full compactions. +1. By specifying `'changelog-producer' = 'full-compaction'`, Paimon will compare the results between full compactions and +produce the differences as changelog. The latency of changelog is affected by the frequency of full compactions. +2. By specifying `full-compaction.delta-commits` table property, full compaction will be constantly triggered after delta +commits (checkpoints). This is set to 1 by default, so each checkpoint will have a full compression and generate a +changelog. -By specifying `full-compaction.delta-commits` table property, full compaction will be constantly triggered after delta commits (checkpoints). This is set to 1 by default, so each checkpoint will have a full compression and generate a change log. +Generally speaking, the cost and consumption of full compaction are high, so we recommend using `'lookup'` changelog +producer. {{< img src="/img/changelog-producer-full-compaction.png">}} {{< hint info >}} -Full compaction changelog producer can produce complete changelog for any type of source. However it is not as efficient as the input changelog producer and the latency to produce changelog might be high. +Full compaction changelog producer can produce complete changelog for any type of source. However it is not as +efficient as the input changelog producer and the latency to produce changelog might be high. 
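Illustrative sketch (not part of the documentation change above): a minimal Flink job that enables the recommended 'lookup' changelog producer on a Paimon primary key table. The catalog name 'paimon', the table 'orders' and its columns are hypothetical; only the 'changelog-producer' option itself comes from the documentation:

    import org.apache.flink.table.api.EnvironmentSettings;
    import org.apache.flink.table.api.TableEnvironment;

    public class LookupChangelogProducerExample {
        public static void main(String[] args) {
            TableEnvironment tEnv =
                    TableEnvironment.create(EnvironmentSettings.inStreamingMode());
            // Assumes a Paimon catalog named 'paimon' is already registered.
            tEnv.executeSql("USE CATALOG paimon");
            tEnv.executeSql(
                    "CREATE TABLE orders ("
                            + "  order_id BIGINT,"
                            + "  amount DECIMAL(10, 2),"
                            + "  PRIMARY KEY (order_id) NOT ENFORCED"
                            + ") WITH ("
                            // Swap in 'full-compaction' (plus 'full-compaction.delta-commits')
                            // for the higher-latency alternative described above.
                            + "  'changelog-producer' = 'lookup'"
                            + ")");
        }
    }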
{{< /hint >}} Full-compaction changelog-producer supports `changelog-producer.row-deduplicate` to avoid generating -U, +U changelog for the same record. - -(Note: Please increase `'execution.checkpointing.max-concurrent-checkpoints'` Flink configuration, this is very -important for performance). From 76a4134838058559fbba2f6a022d7aa3efcd45b0 Mon Sep 17 00:00:00 2001 From: yunfengzhou-hub Date: Mon, 25 Nov 2024 20:10:38 +0800 Subject: [PATCH 058/157] [flink] Adopt open(OpenContext) in RichFunction (#4581) --- .../api/common/functions/OpenContext.java | 29 +++++++++++++++++++ .../api/common/functions/OpenContext.java | 29 +++++++++++++++++++ .../api/common/functions/OpenContext.java | 29 +++++++++++++++++++ .../api/common/functions/OpenContext.java | 29 +++++++++++++++++++ .../paimon/flink/kafka/KafkaSinkFunction.java | 12 +++++++- ...CdcDynamicTableParsingProcessFunction.java | 12 +++++++- .../CdcMultiTableParsingProcessFunction.java | 12 +++++++- .../sink/cdc/CdcParsingProcessFunction.java | 12 +++++++- .../UpdatedDataFieldsProcessFunctionBase.java | 12 +++++++- .../flink/service/QueryAddressRegister.java | 12 +++++++- .../flink/service/QueryFileMonitor.java | 12 +++++++- .../paimon/flink/shuffle/RangeShuffle.java | 15 ++++++++-- .../flink/sink/RowDataStoreWriteOperator.java | 28 ++++++++++++++---- .../apache/paimon/flink/sorter/SortUtils.java | 28 ++++++++++++++++-- .../source/BucketUnawareCompactSource.java | 12 +++++++- .../CombinedAwareBatchSourceFunction.java | 12 +++++++- .../CombinedAwareStreamingSourceFunction.java | 12 +++++++- .../CombinedCompactorSourceFunction.java | 12 +++++++- .../CombinedUnawareBatchSourceFunction.java | 12 +++++++- ...ombinedUnawareStreamingSourceFunction.java | 12 +++++++- 20 files changed, 319 insertions(+), 24 deletions(-) create mode 100644 paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/functions/OpenContext.java create mode 100644 paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/functions/OpenContext.java create mode 100644 paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/functions/OpenContext.java create mode 100644 paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/functions/OpenContext.java diff --git a/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/functions/OpenContext.java b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/functions/OpenContext.java new file mode 100644 index 0000000000000..4ff5484b3b087 --- /dev/null +++ b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/functions/OpenContext.java @@ -0,0 +1,29 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.flink.api.common.functions; + +import org.apache.flink.annotation.PublicEvolving; + +/** + * The {@link OpenContext} interface provides necessary information required by the {@link + * RichFunction} when it is opened. The {@link OpenContext} is currently empty because it can be + * used to add more methods without affecting the signature of {@code RichFunction#open}. + */ +@PublicEvolving +public interface OpenContext {} diff --git a/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/functions/OpenContext.java b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/functions/OpenContext.java new file mode 100644 index 0000000000000..4ff5484b3b087 --- /dev/null +++ b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/functions/OpenContext.java @@ -0,0 +1,29 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.common.functions; + +import org.apache.flink.annotation.PublicEvolving; + +/** + * The {@link OpenContext} interface provides necessary information required by the {@link + * RichFunction} when it is opened. The {@link OpenContext} is currently empty because it can be + * used to add more methods without affecting the signature of {@code RichFunction#open}. + */ +@PublicEvolving +public interface OpenContext {} diff --git a/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/functions/OpenContext.java b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/functions/OpenContext.java new file mode 100644 index 0000000000000..4ff5484b3b087 --- /dev/null +++ b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/functions/OpenContext.java @@ -0,0 +1,29 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.flink.api.common.functions; + +import org.apache.flink.annotation.PublicEvolving; + +/** + * The {@link OpenContext} interface provides necessary information required by the {@link + * RichFunction} when it is opened. The {@link OpenContext} is currently empty because it can be + * used to add more methods without affecting the signature of {@code RichFunction#open}. + */ +@PublicEvolving +public interface OpenContext {} diff --git a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/functions/OpenContext.java b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/functions/OpenContext.java new file mode 100644 index 0000000000000..4ff5484b3b087 --- /dev/null +++ b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/functions/OpenContext.java @@ -0,0 +1,29 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.common.functions; + +import org.apache.flink.annotation.PublicEvolving; + +/** + * The {@link OpenContext} interface provides necessary information required by the {@link + * RichFunction} when it is opened. The {@link OpenContext} is currently empty because it can be + * used to add more methods without affecting the signature of {@code RichFunction#open}. + */ +@PublicEvolving +public interface OpenContext {} diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/kafka/KafkaSinkFunction.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/kafka/KafkaSinkFunction.java index 72a177adceaf3..41e7141cf48a8 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/kafka/KafkaSinkFunction.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/kafka/KafkaSinkFunction.java @@ -21,6 +21,7 @@ import org.apache.paimon.flink.sink.LogSinkFunction; import org.apache.paimon.table.sink.SinkRecord; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.configuration.Configuration; import org.apache.flink.streaming.connectors.kafka.FlinkKafkaException; import org.apache.flink.streaming.connectors.kafka.FlinkKafkaProducer; @@ -65,7 +66,16 @@ public void setWriteCallback(WriteCallback writeCallback) { this.writeCallback = writeCallback; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. 
+ */ public void open(Configuration configuration) throws Exception { super.open(configuration); Callback baseCallback = requireNonNull(callback); diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicTableParsingProcessFunction.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicTableParsingProcessFunction.java index 0961ff160048d..886e33e2046aa 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicTableParsingProcessFunction.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicTableParsingProcessFunction.java @@ -22,6 +22,7 @@ import org.apache.paimon.catalog.Identifier; import org.apache.paimon.types.DataField; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.common.typeinfo.TypeHint; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.java.tuple.Tuple2; @@ -74,7 +75,16 @@ public CdcDynamicTableParsingProcessFunction( this.parserFactory = parserFactory; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ public void open(Configuration parameters) throws Exception { parser = parserFactory.create(); catalog = catalogLoader.load(); diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcMultiTableParsingProcessFunction.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcMultiTableParsingProcessFunction.java index b18a05c280cbf..4c5e0600bb47e 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcMultiTableParsingProcessFunction.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcMultiTableParsingProcessFunction.java @@ -20,6 +20,7 @@ import org.apache.paimon.types.DataField; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.java.typeutils.ListTypeInfo; import org.apache.flink.configuration.Configuration; @@ -51,7 +52,16 @@ public CdcMultiTableParsingProcessFunction(EventParser.Factory parserFactory) this.parserFactory = parserFactory; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. 
+ */ public void open(Configuration parameters) throws Exception { parser = parserFactory.create(); updatedDataFieldsOutputTags = new HashMap<>(); diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcParsingProcessFunction.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcParsingProcessFunction.java index 3456634942c8d..eec228f3c09bb 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcParsingProcessFunction.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcParsingProcessFunction.java @@ -20,6 +20,7 @@ import org.apache.paimon.types.DataField; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.java.typeutils.ListTypeInfo; import org.apache.flink.configuration.Configuration; import org.apache.flink.streaming.api.functions.ProcessFunction; @@ -50,7 +51,16 @@ public CdcParsingProcessFunction(EventParser.Factory parserFactory) { this.parserFactory = parserFactory; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ public void open(Configuration parameters) throws Exception { parser = parserFactory.create(); } diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunctionBase.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunctionBase.java index c2e928bd4a0aa..4f02b784c2ba6 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunctionBase.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunctionBase.java @@ -31,6 +31,7 @@ import org.apache.paimon.utils.Preconditions; import org.apache.paimon.utils.StringUtils; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.configuration.Configuration; import org.apache.flink.streaming.api.functions.ProcessFunction; import org.slf4j.Logger; @@ -73,7 +74,16 @@ protected UpdatedDataFieldsProcessFunctionBase(Catalog.Loader catalogLoader) { this.catalogLoader = catalogLoader; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. 
+ */ public void open(Configuration parameters) { this.catalog = catalogLoader.load(); this.allowUpperCase = this.catalog.allowUpperCase(); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryAddressRegister.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryAddressRegister.java index df3cf7abf2a5f..524f2e5f01c17 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryAddressRegister.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryAddressRegister.java @@ -23,6 +23,7 @@ import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.Table; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.configuration.Configuration; import org.apache.flink.streaming.api.functions.sink.RichSinkFunction; import org.apache.flink.streaming.api.functions.sink.SinkFunction; @@ -44,7 +45,16 @@ public QueryAddressRegister(Table table) { this.serviceManager = ((FileStoreTable) table).store().newServiceManager(); } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ public void open(Configuration parameters) throws Exception { this.executors = new TreeMap<>(); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryFileMonitor.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryFileMonitor.java index 43cf654e91fe6..02f8a654112ea 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryFileMonitor.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryFileMonitor.java @@ -31,6 +31,7 @@ import org.apache.paimon.table.source.TableRead; import org.apache.paimon.table.system.FileMonitorTable; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.configuration.Configuration; import org.apache.flink.streaming.api.datastream.DataStream; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; @@ -70,7 +71,16 @@ public QueryFileMonitor(Table table) { .toMillis(); } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. 
+ */ public void open(Configuration parameters) throws Exception { FileMonitorTable monitorTable = new FileMonitorTable((FileStoreTable) table); ReadBuilder readBuilder = monitorTable.newReadBuilder(); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/shuffle/RangeShuffle.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/shuffle/RangeShuffle.java index 54104130438bf..8760f1dc5f804 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/shuffle/RangeShuffle.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/shuffle/RangeShuffle.java @@ -27,6 +27,7 @@ import org.apache.paimon.utils.SerializableSupplier; import org.apache.flink.annotation.Internal; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.common.functions.Partitioner; import org.apache.flink.api.common.functions.RichMapFunction; import org.apache.flink.api.common.typeinfo.BasicTypeInfo; @@ -182,9 +183,19 @@ public KeyAndSizeExtractor(RowType rowType, boolean isSortBySize) { this.isSortBySize = isSortBySize; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink + * 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink + * 2.0+. + */ public void open(Configuration parameters) throws Exception { - super.open(parameters); InternalRowToSizeVisitor internalRowToSizeVisitor = new InternalRowToSizeVisitor(); fieldSizeCalculator = rowType.getFieldTypes().stream() diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDataStoreWriteOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDataStoreWriteOperator.java index 07fe275543a18..2b25f074667c3 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDataStoreWriteOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDataStoreWriteOperator.java @@ -23,6 +23,8 @@ import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.sink.SinkRecord; +import org.apache.flink.api.common.functions.Function; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.common.functions.RichFunction; import org.apache.flink.api.common.functions.util.FunctionUtils; import org.apache.flink.api.common.state.CheckpointListener; @@ -42,6 +44,8 @@ import javax.annotation.Nullable; import java.io.IOException; +import java.lang.reflect.InvocationTargetException; +import java.lang.reflect.Method; import java.util.List; import java.util.Objects; @@ -97,17 +101,29 @@ public void open() throws Exception { this.sinkContext = new SimpleContext(getProcessingTimeService()); if (logSinkFunction != null) { - // to stay compatible with Flink 1.18- - if (logSinkFunction instanceof RichFunction) { - RichFunction richFunction = (RichFunction) logSinkFunction; - richFunction.open(new Configuration()); - } - + openFunction(logSinkFunction); logCallback = new LogWriteCallback(); logSinkFunction.setWriteCallback(logCallback); } } + private static void openFunction(Function function) throws Exception { + if (function instanceof RichFunction) { + RichFunction richFunction = (RichFunction) function; + + try { + Method method = RichFunction.class.getDeclaredMethod("open", OpenContext.class); + 
method.invoke(richFunction, new OpenContext() {}); + return; + } catch (NoSuchMethodException | IllegalAccessException | InvocationTargetException e) { + // to stay compatible with Flink 1.18- + } + + Method method = RichFunction.class.getDeclaredMethod("open", Configuration.class); + method.invoke(richFunction, new Configuration()); + } + } + @Override public void processWatermark(Watermark mark) throws Exception { super.processWatermark(mark); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sorter/SortUtils.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sorter/SortUtils.java index f590c2fb7fff0..b30e145512966 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sorter/SortUtils.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sorter/SortUtils.java @@ -31,6 +31,7 @@ import org.apache.paimon.utils.KeyProjectedRow; import org.apache.paimon.utils.SerializableSupplier; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.common.functions.RichMapFunction; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.java.tuple.Tuple2; @@ -119,9 +120,19 @@ public static DataStream sortStreamByKey( .map( new RichMapFunction>() { - @Override + /** + * Do not annotate with @override here to maintain + * compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain + * compatibility with Flink 2.0+. + */ public void open(Configuration parameters) throws Exception { - super.open(parameters); shuffleKeyAbstract.open(); } @@ -172,7 +183,18 @@ public Tuple2 map(RowData value) { private transient KeyProjectedRow keyProjectedRow; - @Override + /** + * Do not annotate with @override here to maintain + * compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain + * compatibility with Flink 2.0+. + */ public void open(Configuration parameters) { keyProjectedRow = new KeyProjectedRow(valueProjectionMap); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/BucketUnawareCompactSource.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/BucketUnawareCompactSource.java index d306c7d8e1e5f..e768c717ddaa1 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/BucketUnawareCompactSource.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/BucketUnawareCompactSource.java @@ -26,6 +26,7 @@ import org.apache.paimon.table.source.EndOfScanException; import org.apache.paimon.utils.Preconditions; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.connector.source.Boundedness; import org.apache.flink.configuration.Configuration; import org.apache.flink.streaming.api.datastream.DataStreamSource; @@ -72,7 +73,16 @@ public BucketUnawareCompactSource( this.filter = filter; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. 
+ */ public void open(Configuration parameters) throws Exception { compactionCoordinator = new UnawareAppendTableCompactionCoordinator(table, streaming, filter); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedAwareBatchSourceFunction.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedAwareBatchSourceFunction.java index cee6081aa29f1..2157be51aee4d 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedAwareBatchSourceFunction.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedAwareBatchSourceFunction.java @@ -25,6 +25,7 @@ import org.apache.paimon.table.source.DataSplit; import org.apache.paimon.table.source.Split; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.common.typeinfo.BasicTypeInfo; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.connector.source.Boundedness; @@ -62,7 +63,16 @@ public CombinedAwareBatchSourceFunction( super(catalogLoader, includingPattern, excludingPattern, databasePattern, false); } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ public void open(Configuration parameters) throws Exception { super.open(parameters); tableScan = diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedAwareStreamingSourceFunction.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedAwareStreamingSourceFunction.java index bff690ea30c23..01e0127e9fda7 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedAwareStreamingSourceFunction.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedAwareStreamingSourceFunction.java @@ -25,6 +25,7 @@ import org.apache.paimon.table.source.DataSplit; import org.apache.paimon.table.source.Split; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.common.typeinfo.BasicTypeInfo; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.connector.source.Boundedness; @@ -59,7 +60,16 @@ public CombinedAwareStreamingSourceFunction( this.monitorInterval = monitorInterval; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. 
+ */ public void open(Configuration parameters) throws Exception { super.open(parameters); tableScan = diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedCompactorSourceFunction.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedCompactorSourceFunction.java index 1964927b5cddc..02bb8786505db 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedCompactorSourceFunction.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedCompactorSourceFunction.java @@ -22,6 +22,7 @@ import org.apache.paimon.catalog.Catalog; import org.apache.paimon.table.source.Split; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.configuration.Configuration; import org.apache.flink.streaming.api.functions.source.RichSourceFunction; @@ -70,7 +71,16 @@ public CombinedCompactorSourceFunction( this.isStreaming = isStreaming; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ public void open(Configuration parameters) throws Exception { isRunning = new AtomicBoolean(true); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedUnawareBatchSourceFunction.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedUnawareBatchSourceFunction.java index 8ec8d5f2c1a2e..6a40f10ada615 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedUnawareBatchSourceFunction.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedUnawareBatchSourceFunction.java @@ -29,6 +29,7 @@ import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.Table; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.connector.source.Boundedness; import org.apache.flink.configuration.Configuration; import org.apache.flink.streaming.api.datastream.DataStream; @@ -69,7 +70,16 @@ public CombinedUnawareBatchSourceFunction( super(catalogLoader, includingPattern, excludingPattern, databasePattern, false); } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. 
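Illustrative sketch (not part of PATCH 058): the repeated open(OpenContext) / open(Configuration) pairs above all follow a single pattern. Newer Flink releases call RichFunction#open(OpenContext), while 1.18 and earlier call open(Configuration), so neither method is annotated with @Override and the new signature simply delegates to the old one; the empty OpenContext stubs added for the 1.15 to 1.18 modules make the new signature compile there. A condensed, self-contained example with a hypothetical function class:

    import org.apache.flink.api.common.functions.OpenContext;
    import org.apache.flink.api.common.functions.RichMapFunction;
    import org.apache.flink.configuration.Configuration;

    /** Hypothetical function; mirrors the pattern used throughout the patch. */
    public class VersionAgnosticMapper extends RichMapFunction<String, String> {

        private transient String prefix;

        /** Entry point on Flink 1.19+; no @Override so it still compiles on 1.18-. */
        public void open(OpenContext openContext) throws Exception {
            open(new Configuration());
        }

        /** Entry point on Flink 1.18-; no @Override so it still compiles on 2.0+. */
        public void open(Configuration parameters) throws Exception {
            prefix = "prefix-";
        }

        @Override
        public String map(String value) {
            return prefix + value;
        }
    }

For functions that Paimon invokes itself rather than Flink, such as the log sink function in RowDataStoreWriteOperator above, the patch resolves the right entry point reflectively, trying open(OpenContext) first and falling back to open(Configuration).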
+ */ public void open(Configuration parameters) throws Exception { super.open(parameters); tableScan = diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedUnawareStreamingSourceFunction.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedUnawareStreamingSourceFunction.java index e398e09a84518..b64518a7ef60a 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedUnawareStreamingSourceFunction.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/operator/CombinedUnawareStreamingSourceFunction.java @@ -24,6 +24,7 @@ import org.apache.paimon.flink.compact.MultiUnawareBucketTableScan; import org.apache.paimon.flink.sink.MultiTableCompactionTaskTypeInfo; +import org.apache.flink.api.common.functions.OpenContext; import org.apache.flink.api.connector.source.Boundedness; import org.apache.flink.configuration.Configuration; import org.apache.flink.streaming.api.datastream.DataStream; @@ -55,7 +56,16 @@ public CombinedUnawareStreamingSourceFunction( this.monitorInterval = monitorInterval; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public void open(OpenContext openContext) throws Exception { + open(new Configuration()); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ public void open(Configuration parameters) throws Exception { super.open(parameters); tableScan = From ca4af649cf27f4d280c005cc77bee9c860d50bb1 Mon Sep 17 00:00:00 2001 From: yunfengzhou-hub Date: Mon, 25 Nov 2024 20:11:46 +0800 Subject: [PATCH 059/157] [flink] Adopt getTaskInfo() when acquiring parallelism info (#4583) --- .../flink/utils/RuntimeContextUtils.java | 32 +++++++++++++++++++ .../flink/utils/RuntimeContextUtils.java | 32 +++++++++++++++++++ .../flink/utils/RuntimeContextUtils.java | 32 +++++++++++++++++++ .../flink/utils/RuntimeContextUtils.java | 32 +++++++++++++++++++ .../flink/service/QueryExecutorOperator.java | 10 +++--- .../paimon/flink/sink/CommitterOperator.java | 5 ++- .../sink/HashBucketAssignerOperator.java | 5 +-- .../sink/MultiTablesStoreCompactOperator.java | 7 ++-- .../flink/sink/StoreCompactOperator.java | 7 ++-- .../paimon/flink/sink/TableWriteOperator.java | 5 +-- .../index/GlobalIndexAssignerOperator.java | 5 +-- .../sink/index/IndexBootstrapOperator.java | 5 +-- .../paimon/flink/sorter/SortOperator.java | 4 ++- .../AppendBypassCoordinateOperator.java | 3 +- .../source/BucketUnawareCompactSource.java | 3 +- .../flink/utils/RuntimeContextUtils.java | 32 +++++++++++++++++++ .../UnawareBucketAppendOnlyTableITCase.java | 3 +- 17 files changed, 201 insertions(+), 21 deletions(-) create mode 100644 paimon-flink/paimon-flink-1.15/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java create mode 100644 paimon-flink/paimon-flink-1.16/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java create mode 100644 paimon-flink/paimon-flink-1.17/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java create mode 100644 paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java create mode 100644 paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java diff --git a/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java 
b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java new file mode 100644 index 0000000000000..460fea55ad7a3 --- /dev/null +++ b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java @@ -0,0 +1,32 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink.utils; + +import org.apache.flink.api.common.functions.RuntimeContext; + +/** Utility methods about Flink runtime context to resolve compatibility issues. */ +public class RuntimeContextUtils { + public static int getNumberOfParallelSubtasks(RuntimeContext context) { + return context.getNumberOfParallelSubtasks(); + } + + public static int getIndexOfThisSubtask(RuntimeContext context) { + return context.getIndexOfThisSubtask(); + } +} diff --git a/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java new file mode 100644 index 0000000000000..460fea55ad7a3 --- /dev/null +++ b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java @@ -0,0 +1,32 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink.utils; + +import org.apache.flink.api.common.functions.RuntimeContext; + +/** Utility methods about Flink runtime context to resolve compatibility issues. 
*/ +public class RuntimeContextUtils { + public static int getNumberOfParallelSubtasks(RuntimeContext context) { + return context.getNumberOfParallelSubtasks(); + } + + public static int getIndexOfThisSubtask(RuntimeContext context) { + return context.getIndexOfThisSubtask(); + } +} diff --git a/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java new file mode 100644 index 0000000000000..460fea55ad7a3 --- /dev/null +++ b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java @@ -0,0 +1,32 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink.utils; + +import org.apache.flink.api.common.functions.RuntimeContext; + +/** Utility methods about Flink runtime context to resolve compatibility issues. */ +public class RuntimeContextUtils { + public static int getNumberOfParallelSubtasks(RuntimeContext context) { + return context.getNumberOfParallelSubtasks(); + } + + public static int getIndexOfThisSubtask(RuntimeContext context) { + return context.getIndexOfThisSubtask(); + } +} diff --git a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java new file mode 100644 index 0000000000000..460fea55ad7a3 --- /dev/null +++ b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java @@ -0,0 +1,32 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink.utils; + +import org.apache.flink.api.common.functions.RuntimeContext; + +/** Utility methods about Flink runtime context to resolve compatibility issues. 
*/ +public class RuntimeContextUtils { + public static int getNumberOfParallelSubtasks(RuntimeContext context) { + return context.getNumberOfParallelSubtasks(); + } + + public static int getIndexOfThisSubtask(RuntimeContext context) { + return context.getIndexOfThisSubtask(); + } +} diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryExecutorOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryExecutorOperator.java index 556c308396884..bf0521d55049c 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryExecutorOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryExecutorOperator.java @@ -23,6 +23,7 @@ import org.apache.paimon.data.GenericRow; import org.apache.paimon.data.InternalRow; import org.apache.paimon.disk.IOManager; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.io.DataFileMeta; import org.apache.paimon.io.DataFileMetaSerializer; import org.apache.paimon.service.network.NetworkUtils; @@ -77,8 +78,8 @@ public void initializeState(StateInitializationContext context) throws Exception this.query = ((FileStoreTable) table).newLocalTableQuery().withIOManager(ioManager); KvQueryServer server = new KvQueryServer( - getRuntimeContext().getIndexOfThisSubtask(), - getRuntimeContext().getNumberOfParallelSubtasks(), + RuntimeContextUtils.getIndexOfThisSubtask(getRuntimeContext()), + RuntimeContextUtils.getNumberOfParallelSubtasks(getRuntimeContext()), NetworkUtils.findHostAddress(), Collections.singletonList(0).iterator(), 1, @@ -96,8 +97,9 @@ public void initializeState(StateInitializationContext context) throws Exception this.output.collect( new StreamRecord<>( GenericRow.of( - getRuntimeContext().getNumberOfParallelSubtasks(), - getRuntimeContext().getIndexOfThisSubtask(), + RuntimeContextUtils.getNumberOfParallelSubtasks( + getRuntimeContext()), + RuntimeContextUtils.getIndexOfThisSubtask(getRuntimeContext()), BinaryString.fromString(address.getHostName()), address.getPort()))); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperator.java index 2ec90b8c6c40c..021a5db413d54 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperator.java @@ -18,6 +18,7 @@ package org.apache.paimon.flink.sink; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.utils.Preconditions; import org.apache.flink.runtime.state.StateInitializationContext; @@ -129,7 +130,9 @@ public void initializeState(StateInitializationContext context) throws Exception super.initializeState(context); Preconditions.checkArgument( - !forceSingleParallelism || getRuntimeContext().getNumberOfParallelSubtasks() == 1, + !forceSingleParallelism + || RuntimeContextUtils.getNumberOfParallelSubtasks(getRuntimeContext()) + == 1, "Committer Operator parallelism in paimon MUST be one."); this.currentWatermark = Long.MIN_VALUE; diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/HashBucketAssignerOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/HashBucketAssignerOperator.java index 70fac7a83e93c..0c101c6d1e01f 100644 
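
The four RuntimeContextUtils classes above are identical shims for Flink 1.15 through 1.18, delegating straight to RuntimeContext#getNumberOfParallelSubtasks() and #getIndexOfThisSubtask(); the paimon-flink-common copy further below instead goes through getTaskInfo(), which is where newer Flink exposes this information. Call sites pick up whichever class ships in the module built for their Flink version. For contrast, a single-class alternative based on reflection is sketched below; it is not what the patch does (the per-version classes keep reflection off hot paths), and the class name is hypothetical.

package org.apache.paimon.flink.example; // hypothetical package, for illustration only

import org.apache.flink.api.common.functions.RuntimeContext;

import java.lang.reflect.Method;

/**
 * Illustrative alternative to the per-version shims (NOT what the patch does): probe for
 * the newer getTaskInfo() API reflectively and fall back to the pre-1.19 accessors.
 */
public final class ReflectiveRuntimeContextUtils {

    public static int getNumberOfParallelSubtasks(RuntimeContext context) {
        return query(context, "getNumberOfParallelSubtasks");
    }

    public static int getIndexOfThisSubtask(RuntimeContext context) {
        return query(context, "getIndexOfThisSubtask");
    }

    private static int query(RuntimeContext context, String methodName) {
        try {
            // Newer Flink: subtask information lives on the TaskInfo object.
            Method getTaskInfo = RuntimeContext.class.getMethod("getTaskInfo");
            Object taskInfo = getTaskInfo.invoke(context);
            return (int) getTaskInfo.getReturnType().getMethod(methodName).invoke(taskInfo);
        } catch (NoSuchMethodException e) {
            // Older Flink: the accessor is declared directly on RuntimeContext.
            try {
                return (int) RuntimeContext.class.getMethod(methodName).invoke(context);
            } catch (ReflectiveOperationException inner) {
                throw new IllegalStateException("Unsupported RuntimeContext", inner);
            }
        } catch (ReflectiveOperationException e) {
            throw new IllegalStateException("Failed to read subtask info", e);
        }
    }

    private ReflectiveRuntimeContextUtils() {}
}
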
--- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/HashBucketAssignerOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/HashBucketAssignerOperator.java @@ -19,6 +19,7 @@ package org.apache.paimon.flink.sink; import org.apache.paimon.flink.ProcessRecordAttributesUtil; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.index.BucketAssigner; import org.apache.paimon.index.HashBucketAssigner; import org.apache.paimon.index.SimpleHashBucketAssigner; @@ -76,8 +77,8 @@ public void initializeState(StateInitializationContext context) throws Exception StateUtils.getSingleValueFromState( context, "commit_user_state", String.class, initialCommitUser); - int numberTasks = getRuntimeContext().getNumberOfParallelSubtasks(); - int taskId = getRuntimeContext().getIndexOfThisSubtask(); + int numberTasks = RuntimeContextUtils.getNumberOfParallelSubtasks(getRuntimeContext()); + int taskId = RuntimeContextUtils.getIndexOfThisSubtask(getRuntimeContext()); long targetRowNum = table.coreOptions().dynamicBucketTargetRowNum(); this.assigner = overwrite diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java index 7cb5d30c2f8ed..8a1d3a02df811 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java @@ -22,6 +22,7 @@ import org.apache.paimon.catalog.Catalog; import org.apache.paimon.catalog.Identifier; import org.apache.paimon.data.BinaryRow; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.io.DataFileMeta; import org.apache.paimon.io.DataFileMetaSerializer; import org.apache.paimon.options.Options; @@ -109,8 +110,10 @@ public void initializeState(StateInitializationContext context) throws Exception ChannelComputer.select( partition, bucket, - getRuntimeContext().getNumberOfParallelSubtasks()) - == getRuntimeContext().getIndexOfThisSubtask()); + RuntimeContextUtils.getNumberOfParallelSubtasks( + getRuntimeContext())) + == RuntimeContextUtils.getIndexOfThisSubtask( + getRuntimeContext())); tables = new HashMap<>(); writes = new HashMap<>(); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCompactOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCompactOperator.java index 9b152a81ca225..ac10345bc4257 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCompactOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCompactOperator.java @@ -20,6 +20,7 @@ import org.apache.paimon.CoreOptions; import org.apache.paimon.data.BinaryRow; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.io.DataFileMeta; import org.apache.paimon.io.DataFileMetaSerializer; import org.apache.paimon.options.Options; @@ -92,8 +93,10 @@ public void initializeState(StateInitializationContext context) throws Exception ChannelComputer.select( partition, bucket, - getRuntimeContext().getNumberOfParallelSubtasks()) - == getRuntimeContext().getIndexOfThisSubtask()); + RuntimeContextUtils.getNumberOfParallelSubtasks( + getRuntimeContext())) 
+ == RuntimeContextUtils.getIndexOfThisSubtask( + getRuntimeContext())); write = storeSinkWriteProvider.provide( table, diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/TableWriteOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/TableWriteOperator.java index 67b4720e29645..32fcdd03bdfd5 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/TableWriteOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/TableWriteOperator.java @@ -21,6 +21,7 @@ import org.apache.paimon.annotation.VisibleForTesting; import org.apache.paimon.flink.ProcessRecordAttributesUtil; import org.apache.paimon.flink.sink.StoreSinkWriteState.StateValueFilter; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.options.Options; import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.sink.ChannelComputer; @@ -58,14 +59,14 @@ public void initializeState(StateInitializationContext context) throws Exception super.initializeState(context); boolean containLogSystem = containLogSystem(); - int numTasks = getRuntimeContext().getNumberOfParallelSubtasks(); + int numTasks = RuntimeContextUtils.getNumberOfParallelSubtasks(getRuntimeContext()); StateValueFilter stateFilter = (tableName, partition, bucket) -> { int task = containLogSystem ? ChannelComputer.select(bucket, numTasks) : ChannelComputer.select(partition, bucket, numTasks); - return task == getRuntimeContext().getIndexOfThisSubtask(); + return task == RuntimeContextUtils.getIndexOfThisSubtask(getRuntimeContext()); }; state = createState(context, stateFilter); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/GlobalIndexAssignerOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/GlobalIndexAssignerOperator.java index 7fee3f45f3db7..99cce07fdc574 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/GlobalIndexAssignerOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/GlobalIndexAssignerOperator.java @@ -22,6 +22,7 @@ import org.apache.paimon.crosspartition.KeyPartOrRow; import org.apache.paimon.data.InternalRow; import org.apache.paimon.disk.IOManager; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.table.Table; import org.apache.flink.api.java.tuple.Tuple2; @@ -59,8 +60,8 @@ public void initializeState(StateInitializationContext context) throws Exception assigner.open( computeManagedMemory(this), ioManager, - getRuntimeContext().getNumberOfParallelSubtasks(), - getRuntimeContext().getIndexOfThisSubtask(), + RuntimeContextUtils.getNumberOfParallelSubtasks(getRuntimeContext()), + RuntimeContextUtils.getIndexOfThisSubtask(getRuntimeContext()), this::collect); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/IndexBootstrapOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/IndexBootstrapOperator.java index 501e35dff46cb..5c8ba8f9441f3 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/IndexBootstrapOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/IndexBootstrapOperator.java @@ -21,6 +21,7 @@ import org.apache.paimon.crosspartition.IndexBootstrap; import 
org.apache.paimon.crosspartition.KeyPartOrRow; import org.apache.paimon.data.InternalRow; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.utils.SerializableFunction; import org.apache.flink.api.java.tuple.Tuple2; @@ -50,8 +51,8 @@ public IndexBootstrapOperator( public void initializeState(StateInitializationContext context) throws Exception { super.initializeState(context); bootstrap.bootstrap( - getRuntimeContext().getNumberOfParallelSubtasks(), - getRuntimeContext().getIndexOfThisSubtask(), + RuntimeContextUtils.getNumberOfParallelSubtasks(getRuntimeContext()), + RuntimeContextUtils.getIndexOfThisSubtask(getRuntimeContext()), this::collect); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sorter/SortOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sorter/SortOperator.java index d4d5dd7416816..b6847125fbc66 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sorter/SortOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sorter/SortOperator.java @@ -23,6 +23,7 @@ import org.apache.paimon.data.BinaryRow; import org.apache.paimon.data.InternalRow; import org.apache.paimon.disk.IOManager; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.options.MemorySize; import org.apache.paimon.sort.BinaryExternalSortBuffer; import org.apache.paimon.types.RowType; @@ -79,7 +80,8 @@ public SortOperator( public void open() throws Exception { super.open(); initBuffer(); - if (sinkParallelism != getRuntimeContext().getNumberOfParallelSubtasks()) { + if (sinkParallelism + != RuntimeContextUtils.getNumberOfParallelSubtasks(getRuntimeContext())) { throw new IllegalArgumentException( "Please ensure that the runtime parallelism of the sink matches the initial configuration " + "to avoid potential issues with skewed range partitioning."); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperator.java index 668aa24c145d7..45090f7b68b40 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperator.java @@ -20,6 +20,7 @@ import org.apache.paimon.append.UnawareAppendCompactionTask; import org.apache.paimon.append.UnawareAppendTableCompactionCoordinator; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.utils.ExecutorUtils; @@ -67,7 +68,7 @@ public AppendBypassCoordinateOperator( public void open() throws Exception { super.open(); checkArgument( - getRuntimeContext().getNumberOfParallelSubtasks() == 1, + RuntimeContextUtils.getNumberOfParallelSubtasks(getRuntimeContext()) == 1, "Compaction Coordinator parallelism in paimon MUST be one."); long intervalMs = table.coreOptions().continuousDiscoveryInterval().toMillis(); this.compactTasks = new LinkedBlockingQueue<>(); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/BucketUnawareCompactSource.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/BucketUnawareCompactSource.java index e768c717ddaa1..79ee827fe6e41 100644 --- 
a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/BucketUnawareCompactSource.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/BucketUnawareCompactSource.java @@ -21,6 +21,7 @@ import org.apache.paimon.append.UnawareAppendCompactionTask; import org.apache.paimon.append.UnawareAppendTableCompactionCoordinator; import org.apache.paimon.flink.sink.CompactionTaskTypeInfo; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.predicate.Predicate; import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.source.EndOfScanException; @@ -87,7 +88,7 @@ public void open(Configuration parameters) throws Exception { compactionCoordinator = new UnawareAppendTableCompactionCoordinator(table, streaming, filter); Preconditions.checkArgument( - this.getRuntimeContext().getNumberOfParallelSubtasks() == 1, + RuntimeContextUtils.getNumberOfParallelSubtasks(getRuntimeContext()) == 1, "Compaction Operator parallelism in paimon MUST be one."); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java new file mode 100644 index 0000000000000..34e0d041b6a0c --- /dev/null +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/RuntimeContextUtils.java @@ -0,0 +1,32 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink.utils; + +import org.apache.flink.api.common.functions.RuntimeContext; + +/** Utility methods about Flink runtime context to resolve compatibility issues. 
*/ +public class RuntimeContextUtils { + public static int getNumberOfParallelSubtasks(RuntimeContext context) { + return context.getTaskInfo().getNumberOfParallelSubtasks(); + } + + public static int getIndexOfThisSubtask(RuntimeContext context) { + return context.getTaskInfo().getIndexOfThisSubtask(); + } +} diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/UnawareBucketAppendOnlyTableITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/UnawareBucketAppendOnlyTableITCase.java index cb323542d4c11..f6dfb1b23046b 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/UnawareBucketAppendOnlyTableITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/UnawareBucketAppendOnlyTableITCase.java @@ -20,6 +20,7 @@ import org.apache.paimon.Snapshot; import org.apache.paimon.data.InternalRow; +import org.apache.paimon.flink.utils.RuntimeContextUtils; import org.apache.paimon.fs.Path; import org.apache.paimon.fs.local.LocalFileIO; import org.apache.paimon.reader.RecordReader; @@ -395,7 +396,7 @@ private TestStatelessWriterSource(FileStoreTable table) { @Override public void run(SourceContext sourceContext) throws Exception { - int taskId = getRuntimeContext().getIndexOfThisSubtask(); + int taskId = RuntimeContextUtils.getIndexOfThisSubtask(getRuntimeContext()); // wait some time in parallelism #2, // so that it does not commit in the same checkpoint with parallelism #1 int waitCount = (taskId == 0 ? 0 : 10); From 8d57d3d90a945c8705d3acda3e7bf0ef2cb157ef Mon Sep 17 00:00:00 2001 From: wangwj Date: Tue, 26 Nov 2024 13:02:01 +0800 Subject: [PATCH 060/157] [core] add deletedFileTotalSizeInBytes in result of OrphanFilesClean (#4545) --- .../operation/CleanOrphanFilesResult.java | 54 ++++++++++ .../operation/LocalOrphanFilesClean.java | 64 +++++++----- .../paimon/operation/OrphanFilesClean.java | 38 +++++-- .../apache/paimon/utils/SnapshotManager.java | 10 +- .../operation/LocalOrphanFilesCleanTest.java | 18 ++-- .../procedure/RemoveOrphanFilesProcedure.java | 13 ++- .../flink/RemoveOrphanFilesActionITCase.java | 2 +- .../flink/orphan/FlinkOrphanFilesClean.java | 98 +++++++++++++------ .../procedure/RemoveOrphanFilesProcedure.java | 12 ++- .../RemoveOrphanFilesActionITCaseBase.java | 2 +- .../procedure/RemoveOrphanFilesProcedure.java | 18 +++- .../spark/orphan/SparkOrphanFilesClean.scala | 64 +++++++----- .../RemoveOrphanFilesProcedureTest.scala | 30 +++--- 13 files changed, 291 insertions(+), 132 deletions(-) create mode 100644 paimon-core/src/main/java/org/apache/paimon/operation/CleanOrphanFilesResult.java diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/CleanOrphanFilesResult.java b/paimon-core/src/main/java/org/apache/paimon/operation/CleanOrphanFilesResult.java new file mode 100644 index 0000000000000..5a3bc67f9c95e --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/operation/CleanOrphanFilesResult.java @@ -0,0 +1,54 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. 
You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.operation; + +import org.apache.paimon.fs.Path; + +import java.util.List; + +/** The result of OrphanFilesClean. */ +public class CleanOrphanFilesResult { + + private List deletedFilesPath; + private final long deletedFileCount; + private final long deletedFileTotalLenInBytes; + + public CleanOrphanFilesResult(long deletedFileCount, long deletedFileTotalLenInBytes) { + this.deletedFileCount = deletedFileCount; + this.deletedFileTotalLenInBytes = deletedFileTotalLenInBytes; + } + + public CleanOrphanFilesResult( + List deletedFilesPath, long deletedFileCount, long deletedFileTotalLenInBytes) { + this(deletedFileCount, deletedFileTotalLenInBytes); + this.deletedFilesPath = deletedFilesPath; + } + + public long getDeletedFileCount() { + return deletedFileCount; + } + + public long getDeletedFileTotalLenInBytes() { + return deletedFileTotalLenInBytes; + } + + public List getDeletedFilesPath() { + return deletedFilesPath; + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/LocalOrphanFilesClean.java b/paimon-core/src/main/java/org/apache/paimon/operation/LocalOrphanFilesClean.java index a5eea6d650cf9..511c5fc7fb79b 100644 --- a/paimon-core/src/main/java/org/apache/paimon/operation/LocalOrphanFilesClean.java +++ b/paimon-core/src/main/java/org/apache/paimon/operation/LocalOrphanFilesClean.java @@ -21,12 +21,12 @@ import org.apache.paimon.CoreOptions; import org.apache.paimon.catalog.Catalog; import org.apache.paimon.catalog.Identifier; -import org.apache.paimon.fs.FileStatus; import org.apache.paimon.fs.Path; import org.apache.paimon.manifest.ManifestEntry; import org.apache.paimon.manifest.ManifestFile; import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.Table; +import org.apache.paimon.utils.Pair; import org.apache.paimon.utils.SerializableConsumer; import javax.annotation.Nullable; @@ -47,6 +47,7 @@ import java.util.concurrent.Future; import java.util.concurrent.ThreadPoolExecutor; import java.util.concurrent.TimeUnit; +import java.util.concurrent.atomic.AtomicLong; import java.util.function.Consumer; import java.util.function.Function; import java.util.stream.Collectors; @@ -68,6 +69,8 @@ public class LocalOrphanFilesClean extends OrphanFilesClean { private final List deleteFiles; + private final AtomicLong deletedFilesLenInBytes = new AtomicLong(0); + private Set candidateDeletes; public LocalOrphanFilesClean(FileStoreTable table) { @@ -87,16 +90,18 @@ public LocalOrphanFilesClean( table.coreOptions().deleteFileThreadNum(), "ORPHAN_FILES_CLEAN"); } - public List clean() throws IOException, ExecutionException, InterruptedException { + public CleanOrphanFilesResult clean() + throws IOException, ExecutionException, InterruptedException { List branches = validBranches(); // specially handle to clear snapshot dir - cleanSnapshotDir(branches, deleteFiles::add); + cleanSnapshotDir(branches, deleteFiles::add, deletedFilesLenInBytes::addAndGet); // delete candidate files - Map candidates = getCandidateDeletingFiles(); + Map> candidates = getCandidateDeletingFiles(); if (candidates.isEmpty()) { - return 
deleteFiles; + return new CleanOrphanFilesResult( + deleteFiles, deleteFiles.size(), deletedFilesLenInBytes.get()); } candidateDeletes = new HashSet<>(candidates.keySet()); @@ -108,12 +113,22 @@ public List clean() throws IOException, ExecutionException, InterruptedExc // delete unused files candidateDeletes.removeAll(usedFiles); - candidateDeletes.stream().map(candidates::get).forEach(fileCleaner); + candidateDeletes.stream() + .map(candidates::get) + .forEach( + deleteFileInfo -> { + deletedFilesLenInBytes.addAndGet(deleteFileInfo.getRight()); + fileCleaner.accept(deleteFileInfo.getLeft()); + }); deleteFiles.addAll( - candidateDeletes.stream().map(candidates::get).collect(Collectors.toList())); + candidateDeletes.stream() + .map(candidates::get) + .map(Pair::getLeft) + .collect(Collectors.toList())); candidateDeletes.clear(); - return deleteFiles; + return new CleanOrphanFilesResult( + deleteFiles, deleteFiles.size(), deletedFilesLenInBytes.get()); } private void collectWithoutDataFile( @@ -172,19 +187,20 @@ private Set getUsedFiles(String branch) { * Get all the candidate deleting files in the specified directories and filter them by * olderThanMillis. */ - private Map getCandidateDeletingFiles() { + private Map> getCandidateDeletingFiles() { List fileDirs = listPaimonFileDirs(); - Function> processor = + Function>> processor = path -> tryBestListingDirs(path).stream() .filter(this::oldEnough) - .map(FileStatus::getPath) + .map(status -> Pair.of(status.getPath(), status.getLen())) .collect(Collectors.toList()); - Iterator allPaths = randomlyExecuteSequentialReturn(executor, processor, fileDirs); - Map result = new HashMap<>(); - while (allPaths.hasNext()) { - Path next = allPaths.next(); - result.put(next.getName(), next); + Iterator> allFilesInfo = + randomlyExecuteSequentialReturn(executor, processor, fileDirs); + Map> result = new HashMap<>(); + while (allFilesInfo.hasNext()) { + Pair fileInfo = allFilesInfo.next(); + result.put(fileInfo.getLeft().getName(), fileInfo); } return result; } @@ -197,7 +213,6 @@ public static List createOrphanFilesCleans( SerializableConsumer fileCleaner, @Nullable Integer parallelism) throws Catalog.DatabaseNotExistException, Catalog.TableNotExistException { - List orphanFilesCleans = new ArrayList<>(); List tableNames = Collections.singletonList(tableName); if (tableName == null || "*".equals(tableName)) { tableNames = catalog.listTables(databaseName); @@ -214,6 +229,7 @@ public static List createOrphanFilesCleans( } }; + List orphanFilesCleans = new ArrayList<>(tableNames.size()); for (String t : tableNames) { Identifier identifier = new Identifier(databaseName, t); Table table = catalog.getTable(identifier).copy(dynamicOptions); @@ -230,7 +246,7 @@ public static List createOrphanFilesCleans( return orphanFilesCleans; } - public static long executeDatabaseOrphanFiles( + public static CleanOrphanFilesResult executeDatabaseOrphanFiles( Catalog catalog, String databaseName, @Nullable String tableName, @@ -249,15 +265,17 @@ public static long executeDatabaseOrphanFiles( ExecutorService executorService = Executors.newFixedThreadPool(Runtime.getRuntime().availableProcessors()); - List>> tasks = new ArrayList<>(); + List> tasks = new ArrayList<>(tableCleans.size()); for (LocalOrphanFilesClean clean : tableCleans) { tasks.add(executorService.submit(clean::clean)); } - List cleanOrphanFiles = new ArrayList<>(); - for (Future> task : tasks) { + long deletedFileCount = 0; + long deletedFileTotalLenInBytes = 0; + for (Future task : tasks) { try { - 
cleanOrphanFiles.addAll(task.get()); + deletedFileCount += task.get().getDeletedFileCount(); + deletedFileTotalLenInBytes += task.get().getDeletedFileTotalLenInBytes(); } catch (InterruptedException e) { Thread.currentThread().interrupt(); throw new RuntimeException(e); @@ -267,6 +285,6 @@ public static long executeDatabaseOrphanFiles( } executorService.shutdownNow(); - return cleanOrphanFiles.size(); + return new CleanOrphanFilesResult(deletedFileCount, deletedFileTotalLenInBytes); } } diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/OrphanFilesClean.java b/paimon-core/src/main/java/org/apache/paimon/operation/OrphanFilesClean.java index 869100d9cfb8d..274cdd52fe140 100644 --- a/paimon-core/src/main/java/org/apache/paimon/operation/OrphanFilesClean.java +++ b/paimon-core/src/main/java/org/apache/paimon/operation/OrphanFilesClean.java @@ -120,23 +120,47 @@ protected List validBranches() { return branches; } - protected void cleanSnapshotDir(List branches, Consumer deletedFileConsumer) { + protected void cleanSnapshotDir( + List branches, + Consumer deletedFilesConsumer, + Consumer deletedFilesLenInBytesConsumer) { for (String branch : branches) { FileStoreTable branchTable = table.switchToBranch(branch); SnapshotManager snapshotManager = branchTable.snapshotManager(); // specially handle the snapshot directory - List nonSnapshotFiles = snapshotManager.tryGetNonSnapshotFiles(this::oldEnough); - nonSnapshotFiles.forEach(fileCleaner); - nonSnapshotFiles.forEach(deletedFileConsumer); + List> nonSnapshotFiles = + snapshotManager.tryGetNonSnapshotFiles(this::oldEnough); + nonSnapshotFiles.forEach( + nonSnapshotFile -> + cleanFile( + nonSnapshotFile, + deletedFilesConsumer, + deletedFilesLenInBytesConsumer)); // specially handle the changelog directory - List nonChangelogFiles = snapshotManager.tryGetNonChangelogFiles(this::oldEnough); - nonChangelogFiles.forEach(fileCleaner); - nonChangelogFiles.forEach(deletedFileConsumer); + List> nonChangelogFiles = + snapshotManager.tryGetNonChangelogFiles(this::oldEnough); + nonChangelogFiles.forEach( + nonChangelogFile -> + cleanFile( + nonChangelogFile, + deletedFilesConsumer, + deletedFilesLenInBytesConsumer)); } } + private void cleanFile( + Pair deleteFileInfo, + Consumer deletedFilesConsumer, + Consumer deletedFilesLenInBytesConsumer) { + Path filePath = deleteFileInfo.getLeft(); + Long fileSize = deleteFileInfo.getRight(); + deletedFilesConsumer.accept(filePath); + deletedFilesLenInBytesConsumer.accept(fileSize); + fileCleaner.accept(filePath); + } + protected Set safelyGetAllSnapshots(String branch) throws IOException { FileStoreTable branchTable = table.switchToBranch(branch); SnapshotManager snapshotManager = branchTable.snapshotManager(); diff --git a/paimon-core/src/main/java/org/apache/paimon/utils/SnapshotManager.java b/paimon-core/src/main/java/org/apache/paimon/utils/SnapshotManager.java index 9a120042eaaad..cbe33ffaf4569 100644 --- a/paimon-core/src/main/java/org/apache/paimon/utils/SnapshotManager.java +++ b/paimon-core/src/main/java/org/apache/paimon/utils/SnapshotManager.java @@ -563,15 +563,15 @@ private void collectSnapshots(Consumer pathConsumer, List paths) * Try to get non snapshot files. If any error occurred, just ignore it and return an empty * result. 
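
Across these core changes the clean-up path now carries file sizes alongside paths: listings return Pair<Path, Long>, the per-table cleaners accumulate a byte total in an AtomicLong, and CleanOrphanFilesResult bundles the deleted-file count with the total deleted length in bytes. As a small illustration of how per-table results roll up into a database-wide figure (mirroring executeDatabaseOrphanFiles above), a hypothetical merge helper could look like this; the class below is not part of the patch.

package org.apache.paimon.operation.example; // hypothetical package, for illustration only

import org.apache.paimon.operation.CleanOrphanFilesResult;

import java.util.List;

/** Hypothetical helper that folds per-table results into one aggregated total. */
public final class CleanResultMerger {

    public static CleanOrphanFilesResult merge(List<CleanOrphanFilesResult> perTable) {
        long files = 0;
        long bytes = 0;
        for (CleanOrphanFilesResult result : perTable) {
            files += result.getDeletedFileCount();
            bytes += result.getDeletedFileTotalLenInBytes();
        }
        // The two-argument constructor carries only the aggregated numbers, matching how
        // executeDatabaseOrphanFiles reports a database-wide total without listing paths.
        return new CleanOrphanFilesResult(files, bytes);
    }

    private CleanResultMerger() {}
}
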
*/ - public List tryGetNonSnapshotFiles(Predicate fileStatusFilter) { + public List> tryGetNonSnapshotFiles(Predicate fileStatusFilter) { return listPathWithFilter(snapshotDirectory(), fileStatusFilter, nonSnapshotFileFilter()); } - public List tryGetNonChangelogFiles(Predicate fileStatusFilter) { + public List> tryGetNonChangelogFiles(Predicate fileStatusFilter) { return listPathWithFilter(changelogDirectory(), fileStatusFilter, nonChangelogFileFilter()); } - private List listPathWithFilter( + private List> listPathWithFilter( Path directory, Predicate fileStatusFilter, Predicate fileFilter) { try { FileStatus[] statuses = fileIO.listStatus(directory); @@ -581,8 +581,8 @@ private List listPathWithFilter( return Arrays.stream(statuses) .filter(fileStatusFilter) - .map(FileStatus::getPath) - .filter(fileFilter) + .filter(status -> fileFilter.test(status.getPath())) + .map(status -> Pair.of(status.getPath(), status.getLen())) .collect(Collectors.toList()); } catch (IOException ignored) { return Collections.emptyList(); diff --git a/paimon-core/src/test/java/org/apache/paimon/operation/LocalOrphanFilesCleanTest.java b/paimon-core/src/test/java/org/apache/paimon/operation/LocalOrphanFilesCleanTest.java index fdc68b34abb44..5139dd44957d7 100644 --- a/paimon-core/src/test/java/org/apache/paimon/operation/LocalOrphanFilesCleanTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/operation/LocalOrphanFilesCleanTest.java @@ -165,22 +165,20 @@ public void testNormallyRemoving() throws Throwable { // randomly delete tags List deleteTags = Collections.emptyList(); - if (!allTags.isEmpty()) { - deleteTags = randomlyPick(allTags); - for (String tagName : deleteTags) { - table.deleteTag(tagName); - } + deleteTags = randomlyPick(allTags); + for (String tagName : deleteTags) { + table.deleteTag(tagName); } // first check, nothing will be deleted because the default olderThan interval is 1 day LocalOrphanFilesClean orphanFilesClean = new LocalOrphanFilesClean(table); - assertThat(orphanFilesClean.clean().size()).isEqualTo(0); + assertThat(orphanFilesClean.clean().getDeletedFilesPath().size()).isEqualTo(0); // second check orphanFilesClean = new LocalOrphanFilesClean( table, System.currentTimeMillis() + TimeUnit.SECONDS.toMillis(2)); - List deleted = orphanFilesClean.clean(); + List deleted = orphanFilesClean.clean().getDeletedFilesPath(); try { validate(deleted, snapshotData, new HashMap<>()); } catch (Throwable t) { @@ -363,13 +361,13 @@ public void testCleanOrphanFilesWithChangelogDecoupled(String changelogProducer) // first check, nothing will be deleted because the default olderThan interval is 1 day LocalOrphanFilesClean orphanFilesClean = new LocalOrphanFilesClean(table); - assertThat(orphanFilesClean.clean().size()).isEqualTo(0); + assertThat(orphanFilesClean.clean().getDeletedFilesPath().size()).isEqualTo(0); // second check orphanFilesClean = new LocalOrphanFilesClean( table, System.currentTimeMillis() + TimeUnit.SECONDS.toMillis(2)); - List deleted = orphanFilesClean.clean(); + List deleted = orphanFilesClean.clean().getDeletedFilesPath(); validate(deleted, snapshotData, changelogData); } @@ -399,7 +397,7 @@ public void testAbnormallyRemoving() throws Exception { LocalOrphanFilesClean orphanFilesClean = new LocalOrphanFilesClean( table, System.currentTimeMillis() + TimeUnit.SECONDS.toMillis(2)); - assertThat(orphanFilesClean.clean().size()).isGreaterThan(0); + assertThat(orphanFilesClean.clean().getDeletedFilesPath().size()).isGreaterThan(0); } private void writeData( diff --git 
a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/RemoveOrphanFilesProcedure.java b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/RemoveOrphanFilesProcedure.java index 7695c510b1dc7..b4a3a6b359d91 100644 --- a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/RemoveOrphanFilesProcedure.java +++ b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/RemoveOrphanFilesProcedure.java @@ -20,6 +20,7 @@ import org.apache.paimon.catalog.Identifier; import org.apache.paimon.flink.orphan.FlinkOrphanFilesClean; +import org.apache.paimon.operation.CleanOrphanFilesResult; import org.apache.paimon.operation.LocalOrphanFilesClean; import org.apache.flink.table.procedure.ProcedureContext; @@ -86,11 +87,12 @@ public String[] call( if (mode == null) { mode = "DISTRIBUTED"; } - long deletedFiles; + + CleanOrphanFilesResult cleanOrphanFilesResult; try { switch (mode.toUpperCase(Locale.ROOT)) { case "DISTRIBUTED": - deletedFiles = + cleanOrphanFilesResult = FlinkOrphanFilesClean.executeDatabaseOrphanFiles( procedureContext.getExecutionEnvironment(), catalog, @@ -101,7 +103,7 @@ public String[] call( tableName); break; case "LOCAL": - deletedFiles = + cleanOrphanFilesResult = LocalOrphanFilesClean.executeDatabaseOrphanFiles( catalog, databaseName, @@ -116,7 +118,10 @@ public String[] call( + mode + ". Only 'DISTRIBUTED' and 'LOCAL' are supported."); } - return new String[] {String.valueOf(deletedFiles)}; + return new String[] { + String.valueOf(cleanOrphanFilesResult.getDeletedFileCount()), + String.valueOf(cleanOrphanFilesResult.getDeletedFileTotalLenInBytes()) + }; } catch (Exception e) { throw new RuntimeException(e); } diff --git a/paimon-flink/paimon-flink-1.18/src/test/java/org/apache/paimon/flink/RemoveOrphanFilesActionITCase.java b/paimon-flink/paimon-flink-1.18/src/test/java/org/apache/paimon/flink/RemoveOrphanFilesActionITCase.java index 46b62b6bf3072..a168c3785c7c2 100644 --- a/paimon-flink/paimon-flink-1.18/src/test/java/org/apache/paimon/flink/RemoveOrphanFilesActionITCase.java +++ b/paimon-flink/paimon-flink-1.18/src/test/java/org/apache/paimon/flink/RemoveOrphanFilesActionITCase.java @@ -137,7 +137,7 @@ public void testRunWithoutException() throws Exception { database, tableName); ImmutableList actualDeleteFile = ImmutableList.copyOf(executeSQL(withOlderThan)); - assertThat(actualDeleteFile).containsExactlyInAnyOrder(Row.of("2")); + assertThat(actualDeleteFile).containsExactlyInAnyOrder(Row.of("2"), Row.of("2")); } @Test diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/orphan/FlinkOrphanFilesClean.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/orphan/FlinkOrphanFilesClean.java index 61bebca24af45..23bbbc9b609ca 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/orphan/FlinkOrphanFilesClean.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/orphan/FlinkOrphanFilesClean.java @@ -27,12 +27,15 @@ import org.apache.paimon.fs.Path; import org.apache.paimon.manifest.ManifestEntry; import org.apache.paimon.manifest.ManifestFile; +import org.apache.paimon.operation.CleanOrphanFilesResult; import org.apache.paimon.operation.OrphanFilesClean; import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.Table; +import org.apache.paimon.utils.Pair; import org.apache.paimon.utils.SerializableConsumer; import 
org.apache.flink.api.common.RuntimeExecutionMode; +import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.java.tuple.Tuple2; import org.apache.flink.configuration.Configuration; import org.apache.flink.configuration.CoreOptions; @@ -61,7 +64,6 @@ import java.util.function.Consumer; import java.util.stream.Collectors; -import static org.apache.flink.api.common.typeinfo.BasicTypeInfo.LONG_TYPE_INFO; import static org.apache.flink.api.common.typeinfo.BasicTypeInfo.STRING_TYPE_INFO; import static org.apache.flink.util.Preconditions.checkState; import static org.apache.paimon.utils.Preconditions.checkArgument; @@ -81,7 +83,7 @@ public FlinkOrphanFilesClean( } @Nullable - public DataStream doOrphanClean(StreamExecutionEnvironment env) { + public DataStream doOrphanClean(StreamExecutionEnvironment env) { Configuration flinkConf = new Configuration(); flinkConf.set(ExecutionOptions.RUNTIME_MODE, RuntimeExecutionMode.BATCH); flinkConf.set(ExecutionOptions.SORT_INPUTS, false); @@ -97,8 +99,12 @@ public DataStream doOrphanClean(StreamExecutionEnvironment env) { // snapshot and changelog files are the root of everything, so they are handled specially // here, and subsequently, we will not count their orphan files. - AtomicLong deletedInLocal = new AtomicLong(0); - cleanSnapshotDir(branches, p -> deletedInLocal.incrementAndGet()); + AtomicLong deletedFilesCountInLocal = new AtomicLong(0); + AtomicLong deletedFilesLenInBytesInLocal = new AtomicLong(0); + cleanSnapshotDir( + branches, + path -> deletedFilesCountInLocal.incrementAndGet(), + deletedFilesLenInBytesInLocal::addAndGet); // branch and manifest file final OutputTag> manifestOutputTag = @@ -203,36 +209,45 @@ public void endInput() throws IOException { .map(Path::toUri) .map(Object::toString) .collect(Collectors.toList()); - DataStream candidates = + DataStream> candidates = env.fromCollection(fileDirs) .process( - new ProcessFunction() { + new ProcessFunction>() { @Override public void processElement( String dir, - ProcessFunction.Context ctx, - Collector out) { + ProcessFunction>.Context ctx, + Collector> out) { for (FileStatus fileStatus : tryBestListingDirs(new Path(dir))) { if (oldEnough(fileStatus)) { out.collect( - fileStatus.getPath().toUri().toString()); + Pair.of( + fileStatus + .getPath() + .toUri() + .toString(), + fileStatus.getLen())); } } } }); - DataStream deleted = + DataStream deleted = usedFiles .keyBy(f -> f) - .connect(candidates.keyBy(path -> new Path(path).getName())) + .connect( + candidates.keyBy( + pathAndSize -> new Path(pathAndSize.getKey()).getName())) .transform( "files_join", - LONG_TYPE_INFO, - new BoundedTwoInputOperator() { + TypeInformation.of(CleanOrphanFilesResult.class), + new BoundedTwoInputOperator< + String, Pair, CleanOrphanFilesResult>() { private boolean buildEnd; - private long emitted; + private long emittedFilesCount; + private long emittedFilesLen; private final Set used = new HashSet<>(); @@ -254,8 +269,15 @@ public void endInput(int inputId) { case 2: checkState(buildEnd, "Should build ended."); LOG.info("Finish probe phase."); - LOG.info("Clean files: {}", emitted); - output.collect(new StreamRecord<>(emitted)); + LOG.info( + "Clean files count : {}", + emittedFilesCount); + LOG.info("Clean files size : {}", emittedFilesLen); + output.collect( + new StreamRecord<>( + new CleanOrphanFilesResult( + emittedFilesCount, + emittedFilesLen))); break; } } @@ -266,25 +288,34 @@ public void processElement1(StreamRecord element) { } @Override - public void 
processElement2(StreamRecord element) { + public void processElement2( + StreamRecord> element) { checkState(buildEnd, "Should build ended."); - String value = element.getValue(); + Pair fileInfo = element.getValue(); + String value = fileInfo.getLeft(); Path path = new Path(value); if (!used.contains(path.getName())) { + emittedFilesCount++; + emittedFilesLen += fileInfo.getRight(); fileCleaner.accept(path); LOG.info("Dry clean: {}", path); - emitted++; } } }); - if (deletedInLocal.get() != 0) { - deleted = deleted.union(env.fromElements(deletedInLocal.get())); + if (deletedFilesCountInLocal.get() != 0 || deletedFilesLenInBytesInLocal.get() != 0) { + deleted = + deleted.union( + env.fromElements( + new CleanOrphanFilesResult( + deletedFilesCountInLocal.get(), + deletedFilesLenInBytesInLocal.get()))); } + return deleted; } - public static long executeDatabaseOrphanFiles( + public static CleanOrphanFilesResult executeDatabaseOrphanFiles( StreamExecutionEnvironment env, Catalog catalog, long olderThanMillis, @@ -293,12 +324,13 @@ public static long executeDatabaseOrphanFiles( String databaseName, @Nullable String tableName) throws Catalog.DatabaseNotExistException, Catalog.TableNotExistException { - List> orphanFilesCleans = new ArrayList<>(); List tableNames = Collections.singletonList(tableName); if (tableName == null || "*".equals(tableName)) { tableNames = catalog.listTables(databaseName); } + List> orphanFilesCleans = + new ArrayList<>(tableNames.size()); for (String t : tableNames) { Identifier identifier = new Identifier(databaseName, t); Table table = catalog.getTable(identifier); @@ -307,7 +339,7 @@ public static long executeDatabaseOrphanFiles( "Only FileStoreTable supports remove-orphan-files action. The table type is '%s'.", table.getClass().getName()); - DataStream clean = + DataStream clean = new FlinkOrphanFilesClean( (FileStoreTable) table, olderThanMillis, @@ -319,8 +351,8 @@ public static long executeDatabaseOrphanFiles( } } - DataStream result = null; - for (DataStream clean : orphanFilesCleans) { + DataStream result = null; + for (DataStream clean : orphanFilesCleans) { if (result == null) { result = clean; } else { @@ -331,20 +363,24 @@ public static long executeDatabaseOrphanFiles( return sum(result); } - private static long sum(DataStream deleted) { - long deleteCount = 0; + private static CleanOrphanFilesResult sum(DataStream deleted) { + long deletedFilesCount = 0; + long deletedFilesLenInBytes = 0; if (deleted != null) { try { - CloseableIterator iterator = + CloseableIterator iterator = deleted.global().executeAndCollect("OrphanFilesClean"); while (iterator.hasNext()) { - deleteCount += iterator.next(); + CleanOrphanFilesResult cleanOrphanFilesResult = iterator.next(); + deletedFilesCount += cleanOrphanFilesResult.getDeletedFileCount(); + deletedFilesLenInBytes += + cleanOrphanFilesResult.getDeletedFileTotalLenInBytes(); } iterator.close(); } catch (Exception e) { throw new RuntimeException(e); } } - return deleteCount; + return new CleanOrphanFilesResult(deletedFilesCount, deletedFilesLenInBytes); } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/RemoveOrphanFilesProcedure.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/RemoveOrphanFilesProcedure.java index 10ad878e0ccb5..4cd1b3e003038 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/RemoveOrphanFilesProcedure.java +++ 
b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/RemoveOrphanFilesProcedure.java @@ -20,6 +20,7 @@ import org.apache.paimon.catalog.Identifier; import org.apache.paimon.flink.orphan.FlinkOrphanFilesClean; +import org.apache.paimon.operation.CleanOrphanFilesResult; import org.apache.paimon.operation.LocalOrphanFilesClean; import org.apache.flink.table.annotation.ArgumentHint; @@ -75,11 +76,11 @@ public String[] call( if (mode == null) { mode = "DISTRIBUTED"; } - long deletedFiles; + CleanOrphanFilesResult cleanOrphanFilesResult; try { switch (mode.toUpperCase(Locale.ROOT)) { case "DISTRIBUTED": - deletedFiles = + cleanOrphanFilesResult = FlinkOrphanFilesClean.executeDatabaseOrphanFiles( procedureContext.getExecutionEnvironment(), catalog, @@ -90,7 +91,7 @@ public String[] call( tableName); break; case "LOCAL": - deletedFiles = + cleanOrphanFilesResult = LocalOrphanFilesClean.executeDatabaseOrphanFiles( catalog, databaseName, @@ -105,7 +106,10 @@ public String[] call( + mode + ". Only 'DISTRIBUTED' and 'LOCAL' are supported."); } - return new String[] {String.valueOf(deletedFiles)}; + return new String[] { + String.valueOf(cleanOrphanFilesResult.getDeletedFileCount()), + String.valueOf(cleanOrphanFilesResult.getDeletedFileTotalLenInBytes()) + }; } catch (Exception e) { throw new RuntimeException(e); } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/RemoveOrphanFilesActionITCaseBase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/RemoveOrphanFilesActionITCaseBase.java index 5f874a5a7f9b2..77f3be2f0c765 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/RemoveOrphanFilesActionITCaseBase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/RemoveOrphanFilesActionITCaseBase.java @@ -148,7 +148,7 @@ public void testRunWithoutException(boolean isNamedArgument) throws Exception { tableName); ImmutableList actualDeleteFile = ImmutableList.copyOf(executeSQL(withOlderThan)); - assertThat(actualDeleteFile).containsExactlyInAnyOrder(Row.of("2")); + assertThat(actualDeleteFile).containsExactlyInAnyOrder(Row.of("2"), Row.of("2")); } @ParameterizedTest diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedure.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedure.java index 293e84ca14bd6..a929641106c69 100644 --- a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedure.java +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedure.java @@ -19,6 +19,7 @@ package org.apache.paimon.spark.procedure; import org.apache.paimon.catalog.Catalog; +import org.apache.paimon.operation.CleanOrphanFilesResult; import org.apache.paimon.operation.LocalOrphanFilesClean; import org.apache.paimon.operation.OrphanFilesClean; import org.apache.paimon.spark.catalog.WithPaimonCatalog; @@ -66,7 +67,9 @@ public class RemoveOrphanFilesProcedure extends BaseProcedure { private static final StructType OUTPUT_TYPE = new StructType( new StructField[] { - new StructField("result", LongType, true, Metadata.empty()) + new StructField("deletedFileCount", LongType, true, Metadata.empty()), + new StructField( + "deletedFileTotalLenInBytes", LongType, true, Metadata.empty()) }); private RemoveOrphanFilesProcedure(TableCatalog 
tableCatalog) { @@ -104,11 +107,11 @@ public InternalRow[] call(InternalRow args) { Catalog catalog = ((WithPaimonCatalog) tableCatalog()).paimonCatalog(); String mode = args.isNullAt(4) ? "DISTRIBUTED" : args.getString(4); - long deletedFiles; + CleanOrphanFilesResult cleanOrphanFilesResult; try { switch (mode.toUpperCase(Locale.ROOT)) { case "LOCAL": - deletedFiles = + cleanOrphanFilesResult = LocalOrphanFilesClean.executeDatabaseOrphanFiles( catalog, identifier.getDatabaseName(), @@ -120,7 +123,7 @@ public InternalRow[] call(InternalRow args) { args.isNullAt(3) ? null : args.getInt(3)); break; case "DISTRIBUTED": - deletedFiles = + cleanOrphanFilesResult = SparkOrphanFilesClean.executeDatabaseOrphanFiles( catalog, identifier.getDatabaseName(), @@ -137,7 +140,12 @@ public InternalRow[] call(InternalRow args) { + mode + ". Only 'DISTRIBUTED' and 'LOCAL' are supported."); } - return new InternalRow[] {newInternalRow(deletedFiles)}; + + return new InternalRow[] { + newInternalRow( + cleanOrphanFilesResult.getDeletedFileCount(), + cleanOrphanFilesResult.getDeletedFileTotalLenInBytes()) + }; } catch (Exception e) { throw new RuntimeException(e); } diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/orphan/SparkOrphanFilesClean.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/orphan/SparkOrphanFilesClean.scala index 488d70e349356..fca0493ede287 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/orphan/SparkOrphanFilesClean.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/orphan/SparkOrphanFilesClean.scala @@ -22,15 +22,14 @@ import org.apache.paimon.{utils, Snapshot} import org.apache.paimon.catalog.{Catalog, Identifier} import org.apache.paimon.fs.Path import org.apache.paimon.manifest.{ManifestEntry, ManifestFile} -import org.apache.paimon.operation.OrphanFilesClean +import org.apache.paimon.operation.{CleanOrphanFilesResult, OrphanFilesClean} import org.apache.paimon.operation.OrphanFilesClean.retryReadingFiles import org.apache.paimon.table.FileStoreTable import org.apache.paimon.utils.SerializableConsumer import org.apache.spark.internal.Logging -import org.apache.spark.sql.{Dataset, SparkSession} +import org.apache.spark.sql.{functions, Dataset, SparkSession} import org.apache.spark.sql.catalyst.SQLConfHelper -import org.apache.spark.sql.functions.sum import java.util import java.util.Collections @@ -50,14 +49,18 @@ case class SparkOrphanFilesClean( with SQLConfHelper with Logging { - def doOrphanClean(): (Dataset[Long], Dataset[BranchAndManifestFile]) = { + def doOrphanClean(): (Dataset[(Long, Long)], Dataset[BranchAndManifestFile]) = { import spark.implicits._ val branches = validBranches() - val deletedInLocal = new AtomicLong(0) + val deletedFilesCountInLocal = new AtomicLong(0) + val deletedFilesLenInBytesInLocal = new AtomicLong(0) // snapshot and changelog files are the root of everything, so they are handled specially // here, and subsequently, we will not count their orphan files. 
- cleanSnapshotDir(branches, (_: Path) => deletedInLocal.incrementAndGet) + cleanSnapshotDir( + branches, + (_: Path) => deletedFilesCountInLocal.incrementAndGet, + size => deletedFilesLenInBytesInLocal.addAndGet(size)) val maxBranchParallelism = Math.min(branches.size(), parallelism) // find snapshots using branch and find manifests(manifest, index, statistics) using snapshot @@ -121,10 +124,10 @@ case class SparkOrphanFilesClean( .flatMap { dir => tryBestListingDirs(new Path(dir)).asScala.filter(oldEnough).map { - file => (file.getPath.getName, file.getPath.toUri.toString) + file => (file.getPath.getName, file.getPath.toUri.toString, file.getLen) } } - .toDF("name", "path") + .toDF("name", "path", "len") .repartition(parallelism) // use left anti to filter files which is not used @@ -132,21 +135,30 @@ case class SparkOrphanFilesClean( .join(usedFiles, $"name" === $"used_name", "left_anti") .mapPartitions { it => - var deleted = 0L + var deletedFilesCount = 0L + var deletedFilesLenInBytes = 0L + while (it.hasNext) { - val pathToClean = it.next().getString(1) - specifiedFileCleaner.accept(new Path(pathToClean)) + val fileInfo = it.next(); + val pathToClean = fileInfo.getString(1) + val deletedPath = new Path(pathToClean) + deletedFilesLenInBytes += fileInfo.getLong(2) + specifiedFileCleaner.accept(deletedPath) logInfo(s"Cleaned file: $pathToClean") - deleted += 1 + deletedFilesCount += 1 } - logInfo(s"Total cleaned files: $deleted"); - Iterator.single(deleted) + logInfo( + s"Total cleaned files: $deletedFilesCount, Total cleaned files len : $deletedFilesLenInBytes") + Iterator.single((deletedFilesCount, deletedFilesLenInBytes)) + } + val finalDeletedDataset = + if (deletedFilesCountInLocal.get() != 0 || deletedFilesLenInBytesInLocal.get() != 0) { + deleted.union( + spark.createDataset( + Seq((deletedFilesCountInLocal.get(), deletedFilesLenInBytesInLocal.get())))) + } else { + deleted } - val finalDeletedDataset = if (deletedInLocal.get() != 0) { - deleted.union(spark.createDataset(Seq(deletedInLocal.get()))) - } else { - deleted - } (finalDeletedDataset, usedManifestFiles) } @@ -169,7 +181,7 @@ object SparkOrphanFilesClean extends SQLConfHelper { tableName: String, olderThanMillis: Long, fileCleaner: SerializableConsumer[Path], - parallelismOpt: Integer): Long = { + parallelismOpt: Integer): CleanOrphanFilesResult = { val spark = SparkSession.active val parallelism = if (parallelismOpt == null) { Math.max(spark.sparkContext.defaultParallelism, conf.numShufflePartitions) @@ -192,7 +204,7 @@ object SparkOrphanFilesClean extends SQLConfHelper { table.asInstanceOf[FileStoreTable] } if (tables.isEmpty) { - return 0 + return new CleanOrphanFilesResult(0, 0) } val (deleted, waitToRelease) = tables.map { table => @@ -207,15 +219,15 @@ object SparkOrphanFilesClean extends SQLConfHelper { try { val result = deleted .reduce((l, r) => l.union(r)) - .toDF("deleted") - .agg(sum("deleted")) + .toDF("deletedFilesCount", "deletedFilesLenInBytes") + .agg(functions.sum("deletedFilesCount"), functions.sum("deletedFilesLenInBytes")) .head() - assert(result.schema.size == 1, result.schema) + assert(result.schema.size == 2, result.schema) if (result.isNullAt(0)) { // no files can be deleted - 0 + new CleanOrphanFilesResult(0, 0) } else { - result.getLong(0) + new CleanOrphanFilesResult(result.getLong(0), result.getLong(1)) } } finally { waitToRelease.foreach(_.unpersist()) diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedureTest.scala 
b/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedureTest.scala index d9d73811266dd..3ffe7fba264f0 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedureTest.scala +++ b/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedureTest.scala @@ -52,7 +52,7 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { fileIO.tryToWriteAtomic(orphanFile2, "b") // by default, no file deleted - checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0) :: Nil) + checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0, 0) :: Nil) val orphanFile2ModTime = fileIO.getFileStatus(orphanFile2).getModificationTime val older_than1 = DateTimeUtils.formatLocalDateTime( @@ -63,7 +63,7 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { checkAnswer( spark.sql(s"CALL sys.remove_orphan_files(table => 'T', older_than => '$older_than1')"), - Row(1) :: Nil) + Row(1, 1) :: Nil) val older_than2 = DateTimeUtils.formatLocalDateTime( DateTimeUtils.toLocalDateTime(System.currentTimeMillis()), @@ -71,9 +71,9 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { checkAnswer( spark.sql(s"CALL sys.remove_orphan_files(table => 'T', older_than => '$older_than2')"), - Row(1) :: Nil) + Row(1, 1) :: Nil) - checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0) :: Nil) + checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0, 0) :: Nil) } test("Paimon procedure: dry run remove orphan files") { @@ -97,7 +97,7 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { fileIO.writeFile(orphanFile2, "b", true) // by default, no file deleted - checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0) :: Nil) + checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0, 0) :: Nil) val older_than = DateTimeUtils.formatLocalDateTime( DateTimeUtils.toLocalDateTime(System.currentTimeMillis()), @@ -106,10 +106,10 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { checkAnswer( spark.sql( s"CALL sys.remove_orphan_files(table => 'T', older_than => '$older_than', dry_run => true)"), - Row(2) :: Nil + Row(2, 2) :: Nil ) - checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0) :: Nil) + checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0, 0) :: Nil) } test("Paimon procedure: remove database orphan files") { @@ -146,7 +146,7 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { fileIO2.tryToWriteAtomic(orphanFile22, "b") // by default, no file deleted - checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'test.*')"), Row(0) :: Nil) + checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'test.*')"), Row(0, 0) :: Nil) val orphanFile12ModTime = fileIO1.getFileStatus(orphanFile12).getModificationTime val older_than1 = DateTimeUtils.formatLocalDateTime( @@ -157,7 +157,7 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { checkAnswer( spark.sql(s"CALL sys.remove_orphan_files(table => 'test.*', older_than => '$older_than1')"), - Row(2) :: Nil + Row(2, 2) :: Nil ) val older_than2 = DateTimeUtils.formatLocalDateTime( @@ -166,10 +166,10 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { checkAnswer( spark.sql(s"CALL sys.remove_orphan_files(table => 'test.*', older_than => 
'$older_than2')"), - Row(2) :: Nil + Row(2, 2) :: Nil ) - checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'test.*')"), Row(0) :: Nil) + checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'test.*')"), Row(0, 0) :: Nil) } test("Paimon procedure: remove orphan files with mode") { @@ -193,7 +193,7 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { fileIO.tryToWriteAtomic(orphanFile2, "b") // by default, no file deleted - checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0) :: Nil) + checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0, 0) :: Nil) val orphanFile2ModTime = fileIO.getFileStatus(orphanFile2).getModificationTime val older_than1 = DateTimeUtils.formatLocalDateTime( @@ -205,7 +205,7 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { checkAnswer( spark.sql( s"CALL sys.remove_orphan_files(table => 'T', older_than => '$older_than1', mode => 'diSTributed')"), - Row(1) :: Nil) + Row(1, 1) :: Nil) val older_than2 = DateTimeUtils.formatLocalDateTime( DateTimeUtils.toLocalDateTime(System.currentTimeMillis()), @@ -214,9 +214,9 @@ class RemoveOrphanFilesProcedureTest extends PaimonSparkTestBase { checkAnswer( spark.sql( s"CALL sys.remove_orphan_files(table => 'T', older_than => '$older_than2', mode => 'local')"), - Row(1) :: Nil) + Row(1, 1) :: Nil) - checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0) :: Nil) + checkAnswer(spark.sql(s"CALL sys.remove_orphan_files(table => 'T')"), Row(0, 0) :: Nil) } } From ee466bcac14bd7f1229beeaf4e405da0956792ca Mon Sep 17 00:00:00 2001 From: Jingsong Date: Tue, 26 Nov 2024 13:07:43 +0800 Subject: [PATCH 061/157] [core] CleanOrphanFilesResult.deletedFilesPath should be nullable --- .../paimon/operation/CleanOrphanFilesResult.java | 16 +++++++++++----- .../paimon/operation/LocalOrphanFilesClean.java | 4 ++-- 2 files changed, 13 insertions(+), 7 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/CleanOrphanFilesResult.java b/paimon-core/src/main/java/org/apache/paimon/operation/CleanOrphanFilesResult.java index 5a3bc67f9c95e..d29eede720ac9 100644 --- a/paimon-core/src/main/java/org/apache/paimon/operation/CleanOrphanFilesResult.java +++ b/paimon-core/src/main/java/org/apache/paimon/operation/CleanOrphanFilesResult.java @@ -20,24 +20,29 @@ import org.apache.paimon.fs.Path; +import javax.annotation.Nullable; + import java.util.List; /** The result of OrphanFilesClean. 
*/ public class CleanOrphanFilesResult { - private List deletedFilesPath; private final long deletedFileCount; private final long deletedFileTotalLenInBytes; + @Nullable private final List deletedFilesPath; + public CleanOrphanFilesResult(long deletedFileCount, long deletedFileTotalLenInBytes) { - this.deletedFileCount = deletedFileCount; - this.deletedFileTotalLenInBytes = deletedFileTotalLenInBytes; + this(deletedFileCount, deletedFileTotalLenInBytes, null); } public CleanOrphanFilesResult( - List deletedFilesPath, long deletedFileCount, long deletedFileTotalLenInBytes) { - this(deletedFileCount, deletedFileTotalLenInBytes); + long deletedFileCount, + long deletedFileTotalLenInBytes, + @Nullable List deletedFilesPath) { this.deletedFilesPath = deletedFilesPath; + this.deletedFileCount = deletedFileCount; + this.deletedFileTotalLenInBytes = deletedFileTotalLenInBytes; } public long getDeletedFileCount() { @@ -48,6 +53,7 @@ public long getDeletedFileTotalLenInBytes() { return deletedFileTotalLenInBytes; } + @Nullable public List getDeletedFilesPath() { return deletedFilesPath; } diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/LocalOrphanFilesClean.java b/paimon-core/src/main/java/org/apache/paimon/operation/LocalOrphanFilesClean.java index 511c5fc7fb79b..6a4276662468b 100644 --- a/paimon-core/src/main/java/org/apache/paimon/operation/LocalOrphanFilesClean.java +++ b/paimon-core/src/main/java/org/apache/paimon/operation/LocalOrphanFilesClean.java @@ -101,7 +101,7 @@ public CleanOrphanFilesResult clean() Map> candidates = getCandidateDeletingFiles(); if (candidates.isEmpty()) { return new CleanOrphanFilesResult( - deleteFiles, deleteFiles.size(), deletedFilesLenInBytes.get()); + deleteFiles.size(), deletedFilesLenInBytes.get(), deleteFiles); } candidateDeletes = new HashSet<>(candidates.keySet()); @@ -128,7 +128,7 @@ public CleanOrphanFilesResult clean() candidateDeletes.clear(); return new CleanOrphanFilesResult( - deleteFiles, deleteFiles.size(), deletedFilesLenInBytes.get()); + deleteFiles.size(), deletedFilesLenInBytes.get(), deleteFiles); } private void collectWithoutDataFile( From 61ee6f8f4526603deae5be44fffb8a0168823565 Mon Sep 17 00:00:00 2001 From: yunfengzhou-hub Date: Tue, 26 Nov 2024 14:27:22 +0800 Subject: [PATCH 062/157] [flink] Avoid deprecated usages about Configuration (#4584) --- .../apache/paimon/benchmark/QueryRunner.java | 2 +- .../serialization/SerializerConfig.java | 22 ++++++ .../serialization/SerializerConfigImpl.java | 22 ++++++ .../serialization/SerializerConfig.java | 22 ++++++ .../serialization/SerializerConfigImpl.java | 22 ++++++ .../serialization/SerializerConfig.java | 22 ++++++ .../serialization/SerializerConfigImpl.java | 22 ++++++ .../serialization/SerializerConfig.java | 22 ++++++ .../serialization/SerializerConfigImpl.java | 22 ++++++ ...afkaDebeziumAvroDeserializationSchema.java | 2 +- .../strategy/MongoVersionStrategy.java | 8 +-- .../action/cdc/mysql/MySqlRecordParser.java | 15 +++-- ...lsarDebeziumAvroDeserializationSchema.java | 2 +- .../cdc/mongodb/MongodbSchemaITCase.java | 67 +++++++++---------- .../cdc/mysql/MySqlSyncTableActionITCase.java | 10 ++- .../sink/cdc/CdcRecordSerializeITCase.java | 28 ++++++-- .../changelog/ChangelogTaskTypeInfo.java | 13 +++- .../flink/sink/CommittableTypeInfo.java | 12 +++- .../flink/sink/CompactionTaskTypeInfo.java | 12 +++- .../apache/paimon/flink/sink/FlinkSink.java | 7 +- .../sink/MultiTableCommittableTypeInfo.java | 12 +++- .../MultiTableCompactionTaskTypeInfo.java | 13 +++- 
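Editor's note: with deletedFilesPath now nullable, callers should guard the getter, since the distributed cleans only carry the aggregate numbers while the local clean also tracks the concrete paths. A short usage sketch under that assumption; the Result class below is a simplified, self-contained copy (paths as String instead of Path) used only for illustration.

import java.util.Arrays;
import java.util.Collections;
import java.util.List;

public class NullableResultUsageSketch {

    // Simplified copy of the result class from the diff: the path list is optional.
    static final class Result {
        private final long deletedFileCount;
        private final long deletedFileTotalLenInBytes;
        private final List<String> deletedFilesPath; // may be null

        Result(long deletedFileCount, long deletedFileTotalLenInBytes) {
            this(deletedFileCount, deletedFileTotalLenInBytes, null);
        }

        Result(
                long deletedFileCount,
                long deletedFileTotalLenInBytes,
                List<String> deletedFilesPath) {
            this.deletedFileCount = deletedFileCount;
            this.deletedFileTotalLenInBytes = deletedFileTotalLenInBytes;
            this.deletedFilesPath = deletedFilesPath;
        }

        // Null-safe access for callers that only care about the paths when present.
        List<String> deletedFilesPathOrEmpty() {
            return deletedFilesPath == null ? Collections.emptyList() : deletedFilesPath;
        }
    }

    public static void main(String[] args) {
        // Distributed mode: only aggregate numbers are available.
        Result distributed = new Result(5, 640);
        // Local mode: the concrete paths are tracked as well.
        Result local = new Result(2, 128, Arrays.asList("/warehouse/db/t/orphan-0"));

        System.out.println(distributed.deletedFilesPathOrEmpty().size()); // 0
        System.out.println(local.deletedFilesPathOrEmpty().size());       // 1
    }
}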
.../flink/source/FlinkSourceBuilder.java | 16 ++--- .../AlignedContinuousFileStoreSource.java | 2 +- .../paimon/flink/utils/InternalTypeInfo.java | 14 +++- .../paimon/flink/utils/JavaTypeInfo.java | 16 ++++- .../paimon/flink/FileSystemCatalogITCase.java | 3 +- .../paimon/flink/FlinkJobRecoveryITCase.java | 9 ++- .../paimon/flink/RescaleBucketITCase.java | 4 +- .../UnawareBucketAppendOnlyTableITCase.java | 14 +++- .../flink/sink/SinkSavepointITCase.java | 2 +- .../paimon/flink/util/AbstractTestBase.java | 14 ++-- .../flink/util/ReadWriteTableTestUtil.java | 26 ++++--- .../paimon/hive/HiveCatalogITCaseBase.java | 6 +- 34 files changed, 396 insertions(+), 109 deletions(-) create mode 100644 paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java create mode 100644 paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java create mode 100644 paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java create mode 100644 paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java create mode 100644 paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java create mode 100644 paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java create mode 100644 paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java create mode 100644 paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java diff --git a/paimon-benchmark/paimon-cluster-benchmark/src/main/java/org/apache/paimon/benchmark/QueryRunner.java b/paimon-benchmark/paimon-cluster-benchmark/src/main/java/org/apache/paimon/benchmark/QueryRunner.java index b07cdef8465ee..8bfe4b6c9c03a 100644 --- a/paimon-benchmark/paimon-cluster-benchmark/src/main/java/org/apache/paimon/benchmark/QueryRunner.java +++ b/paimon-benchmark/paimon-cluster-benchmark/src/main/java/org/apache/paimon/benchmark/QueryRunner.java @@ -77,7 +77,7 @@ public Result run() { String sinkPathConfig = BenchmarkGlobalConfiguration.loadConfiguration() - .getString(BenchmarkOptions.SINK_PATH); + .get(BenchmarkOptions.SINK_PATH); if (sinkPathConfig == null) { throw new IllegalArgumentException( BenchmarkOptions.SINK_PATH.key() + " must be set"); diff --git a/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java new file mode 100644 index 0000000000000..16987469a948f --- /dev/null +++ b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. 
You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.common.serialization; + +/** Placeholder class to resolve compatibility issues. */ +public interface SerializerConfig {} diff --git a/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java new file mode 100644 index 0000000000000..374d33f6500d5 --- /dev/null +++ b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.common.serialization; + +/** Placeholder class to resolve compatibility issues. */ +public class SerializerConfigImpl implements SerializerConfig {} diff --git a/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java new file mode 100644 index 0000000000000..16987469a948f --- /dev/null +++ b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.common.serialization; + +/** Placeholder class to resolve compatibility issues. 
*/ +public interface SerializerConfig {} diff --git a/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java new file mode 100644 index 0000000000000..374d33f6500d5 --- /dev/null +++ b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.common.serialization; + +/** Placeholder class to resolve compatibility issues. */ +public class SerializerConfigImpl implements SerializerConfig {} diff --git a/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java new file mode 100644 index 0000000000000..16987469a948f --- /dev/null +++ b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.common.serialization; + +/** Placeholder class to resolve compatibility issues. */ +public interface SerializerConfig {} diff --git a/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java new file mode 100644 index 0000000000000..374d33f6500d5 --- /dev/null +++ b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. 
See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.common.serialization; + +/** Placeholder class to resolve compatibility issues. */ +public class SerializerConfigImpl implements SerializerConfig {} diff --git a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java new file mode 100644 index 0000000000000..16987469a948f --- /dev/null +++ b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/serialization/SerializerConfig.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.common.serialization; + +/** Placeholder class to resolve compatibility issues. */ +public interface SerializerConfig {} diff --git a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java new file mode 100644 index 0000000000000..374d33f6500d5 --- /dev/null +++ b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/common/serialization/SerializerConfigImpl.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.flink.api.common.serialization; + +/** Placeholder class to resolve compatibility issues. */ +public class SerializerConfigImpl implements SerializerConfig {} diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/kafka/KafkaDebeziumAvroDeserializationSchema.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/kafka/KafkaDebeziumAvroDeserializationSchema.java index fc672b9dc0ab6..eea364d460dee 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/kafka/KafkaDebeziumAvroDeserializationSchema.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/kafka/KafkaDebeziumAvroDeserializationSchema.java @@ -48,7 +48,7 @@ public class KafkaDebeziumAvroDeserializationSchema public KafkaDebeziumAvroDeserializationSchema(Configuration cdcSourceConfig) { this.topic = KafkaActionUtils.findOneTopic(cdcSourceConfig); - this.schemaRegistryUrl = cdcSourceConfig.getString(SCHEMA_REGISTRY_URL); + this.schemaRegistryUrl = cdcSourceConfig.get(SCHEMA_REGISTRY_URL); } @Override diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/mongodb/strategy/MongoVersionStrategy.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/mongodb/strategy/MongoVersionStrategy.java index 64f127571134b..df288a4150e63 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/mongodb/strategy/MongoVersionStrategy.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/mongodb/strategy/MongoVersionStrategy.java @@ -83,7 +83,7 @@ default Map getExtractRow( Configuration mongodbConfig) throws JsonProcessingException { SchemaAcquisitionMode mode = - SchemaAcquisitionMode.valueOf(mongodbConfig.getString(START_MODE).toUpperCase()); + SchemaAcquisitionMode.valueOf(mongodbConfig.get(START_MODE).toUpperCase()); ObjectNode objectNode = JsonSerdeUtil.asSpecificNodeType(jsonNode.asText(), ObjectNode.class); JsonNode idNode = objectNode.get(ID_FIELD); @@ -92,7 +92,7 @@ default Map getExtractRow( "The provided MongoDB JSON document does not contain an _id field."); } JsonNode document = - mongodbConfig.getBoolean(DEFAULT_ID_GENERATION) + mongodbConfig.get(DEFAULT_ID_GENERATION) ? objectNode.set( ID_FIELD, idNode.get(OID_FIELD) == null ? 
idNode : idNode.get(OID_FIELD)) @@ -101,8 +101,8 @@ default Map getExtractRow( case SPECIFIED: return parseFieldsFromJsonRecord( document.toString(), - mongodbConfig.getString(PARSER_PATH), - mongodbConfig.getString(FIELD_NAME), + mongodbConfig.get(PARSER_PATH), + mongodbConfig.get(FIELD_NAME), computedColumns, rowTypeBuilder); case DYNAMIC: diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/mysql/MySqlRecordParser.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/mysql/MySqlRecordParser.java index 502e6237a477e..26579e718f564 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/mysql/MySqlRecordParser.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/mysql/MySqlRecordParser.java @@ -45,6 +45,8 @@ import org.apache.flink.api.common.functions.FlatMapFunction; import org.apache.flink.cdc.connectors.mysql.source.config.MySqlSourceOptions; import org.apache.flink.cdc.debezium.table.DebeziumOptions; +import org.apache.flink.configuration.ConfigOption; +import org.apache.flink.configuration.ConfigOptions; import org.apache.flink.configuration.Configuration; import org.apache.flink.util.Collector; import org.slf4j.Logger; @@ -99,11 +101,14 @@ public MySqlRecordParser( .configure(DeserializationFeature.FAIL_ON_UNKNOWN_PROPERTIES, false); String stringifyServerTimeZone = mySqlConfig.get(MySqlSourceOptions.SERVER_TIME_ZONE); - this.isDebeziumSchemaCommentsEnabled = - mySqlConfig.getBoolean( - DebeziumOptions.DEBEZIUM_OPTIONS_PREFIX - + RelationalDatabaseConnectorConfig.INCLUDE_SCHEMA_COMMENTS.name(), - false); + ConfigOption includeSchemaCommentsConfig = + ConfigOptions.key( + DebeziumOptions.DEBEZIUM_OPTIONS_PREFIX + + RelationalDatabaseConnectorConfig.INCLUDE_SCHEMA_COMMENTS + .name()) + .booleanType() + .defaultValue(false); + this.isDebeziumSchemaCommentsEnabled = mySqlConfig.get(includeSchemaCommentsConfig); this.serverTimeZone = stringifyServerTimeZone == null ? 
ZoneId.systemDefault() diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/pulsar/PulsarDebeziumAvroDeserializationSchema.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/pulsar/PulsarDebeziumAvroDeserializationSchema.java index b0d1d1bf620f5..f45ee034bec84 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/pulsar/PulsarDebeziumAvroDeserializationSchema.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/action/cdc/pulsar/PulsarDebeziumAvroDeserializationSchema.java @@ -46,7 +46,7 @@ public class PulsarDebeziumAvroDeserializationSchema public PulsarDebeziumAvroDeserializationSchema(Configuration cdcSourceConfig) { this.topic = PulsarActionUtils.findOneTopic(cdcSourceConfig); - this.schemaRegistryUrl = cdcSourceConfig.getString(SCHEMA_REGISTRY_URL); + this.schemaRegistryUrl = cdcSourceConfig.get(SCHEMA_REGISTRY_URL); } @Override diff --git a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/mongodb/MongodbSchemaITCase.java b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/mongodb/MongodbSchemaITCase.java index 394cdd1f149bc..f0328b5663246 100644 --- a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/mongodb/MongodbSchemaITCase.java +++ b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/mongodb/MongodbSchemaITCase.java @@ -76,13 +76,12 @@ public static void initMongoDB() { @Test public void testCreateSchemaFromValidConfig() { Configuration mongodbConfig = new Configuration(); - mongodbConfig.setString(MongoDBSourceOptions.HOSTS, MONGODB_CONTAINER.getHostAndPort()); - mongodbConfig.setString(MongoDBSourceOptions.USERNAME, MongoDBContainer.PAIMON_USER); - mongodbConfig.setString( - MongoDBSourceOptions.PASSWORD, MongoDBContainer.PAIMON_USER_PASSWORD); - mongodbConfig.setString(MongoDBSourceOptions.CONNECTION_OPTIONS, "authSource=admin"); - mongodbConfig.setString(MongoDBSourceOptions.DATABASE, "testDatabase"); - mongodbConfig.setString(MongoDBSourceOptions.COLLECTION, "testCollection"); + mongodbConfig.set(MongoDBSourceOptions.HOSTS, MONGODB_CONTAINER.getHostAndPort()); + mongodbConfig.set(MongoDBSourceOptions.USERNAME, MongoDBContainer.PAIMON_USER); + mongodbConfig.set(MongoDBSourceOptions.PASSWORD, MongoDBContainer.PAIMON_USER_PASSWORD); + mongodbConfig.set(MongoDBSourceOptions.CONNECTION_OPTIONS, "authSource=admin"); + mongodbConfig.set(MongoDBSourceOptions.DATABASE, "testDatabase"); + mongodbConfig.set(MongoDBSourceOptions.COLLECTION, "testCollection"); Schema schema = MongodbSchemaUtils.getMongodbSchema(mongodbConfig); assertNotNull(schema); } @@ -90,13 +89,12 @@ public void testCreateSchemaFromValidConfig() { @Test public void testCreateSchemaFromInvalidHost() { Configuration mongodbConfig = new Configuration(); - mongodbConfig.setString(MongoDBSourceOptions.HOSTS, "127.0.0.1:12345"); - mongodbConfig.setString(MongoDBSourceOptions.USERNAME, MongoDBContainer.PAIMON_USER); - mongodbConfig.setString( - MongoDBSourceOptions.PASSWORD, MongoDBContainer.PAIMON_USER_PASSWORD); - mongodbConfig.setString(MongoDBSourceOptions.CONNECTION_OPTIONS, "authSource=admin"); - mongodbConfig.setString(MongoDBSourceOptions.DATABASE, "testDatabase"); - mongodbConfig.setString(MongoDBSourceOptions.COLLECTION, "testCollection"); + mongodbConfig.set(MongoDBSourceOptions.HOSTS, "127.0.0.1:12345"); + mongodbConfig.set(MongoDBSourceOptions.USERNAME, 
MongoDBContainer.PAIMON_USER); + mongodbConfig.set(MongoDBSourceOptions.PASSWORD, MongoDBContainer.PAIMON_USER_PASSWORD); + mongodbConfig.set(MongoDBSourceOptions.CONNECTION_OPTIONS, "authSource=admin"); + mongodbConfig.set(MongoDBSourceOptions.DATABASE, "testDatabase"); + mongodbConfig.set(MongoDBSourceOptions.COLLECTION, "testCollection"); assertThrows( RuntimeException.class, () -> MongodbSchemaUtils.getMongodbSchema(mongodbConfig)); @@ -106,7 +104,7 @@ public void testCreateSchemaFromInvalidHost() { public void testCreateSchemaFromIncompleteConfig() { // Create a Configuration object with missing necessary settings Configuration mongodbConfig = new Configuration(); - mongodbConfig.setString(MongoDBSourceOptions.HOSTS, MONGODB_CONTAINER.getHostAndPort()); + mongodbConfig.set(MongoDBSourceOptions.HOSTS, MONGODB_CONTAINER.getHostAndPort()); // Expect an exception to be thrown due to missing necessary settings assertThrows( NullPointerException.class, @@ -117,13 +115,12 @@ public void testCreateSchemaFromIncompleteConfig() { public void testCreateSchemaFromDynamicConfig() { // Create a Configuration object with the necessary settings Configuration mongodbConfig = new Configuration(); - mongodbConfig.setString(MongoDBSourceOptions.HOSTS, MONGODB_CONTAINER.getHostAndPort()); - mongodbConfig.setString(MongoDBSourceOptions.USERNAME, MongoDBContainer.PAIMON_USER); - mongodbConfig.setString( - MongoDBSourceOptions.PASSWORD, MongoDBContainer.PAIMON_USER_PASSWORD); - mongodbConfig.setString(MongoDBSourceOptions.CONNECTION_OPTIONS, "authSource=admin"); - mongodbConfig.setString(MongoDBSourceOptions.DATABASE, "testDatabase"); - mongodbConfig.setString(MongoDBSourceOptions.COLLECTION, "testCollection"); + mongodbConfig.set(MongoDBSourceOptions.HOSTS, MONGODB_CONTAINER.getHostAndPort()); + mongodbConfig.set(MongoDBSourceOptions.USERNAME, MongoDBContainer.PAIMON_USER); + mongodbConfig.set(MongoDBSourceOptions.PASSWORD, MongoDBContainer.PAIMON_USER_PASSWORD); + mongodbConfig.set(MongoDBSourceOptions.CONNECTION_OPTIONS, "authSource=admin"); + mongodbConfig.set(MongoDBSourceOptions.DATABASE, "testDatabase"); + mongodbConfig.set(MongoDBSourceOptions.COLLECTION, "testCollection"); // Call the method and check the results Schema schema = MongodbSchemaUtils.getMongodbSchema(mongodbConfig); @@ -142,13 +139,12 @@ public void testCreateSchemaFromDynamicConfig() { @Test public void testCreateSchemaFromInvalidDatabase() { Configuration mongodbConfig = new Configuration(); - mongodbConfig.setString(MongoDBSourceOptions.HOSTS, MONGODB_CONTAINER.getHostAndPort()); - mongodbConfig.setString(MongoDBSourceOptions.USERNAME, MongoDBContainer.PAIMON_USER); - mongodbConfig.setString( - MongoDBSourceOptions.PASSWORD, MongoDBContainer.PAIMON_USER_PASSWORD); - mongodbConfig.setString(MongoDBSourceOptions.CONNECTION_OPTIONS, "authSource=admin"); - mongodbConfig.setString(MongoDBSourceOptions.DATABASE, "invalidDatabase"); - mongodbConfig.setString(MongoDBSourceOptions.COLLECTION, "testCollection"); + mongodbConfig.set(MongoDBSourceOptions.HOSTS, MONGODB_CONTAINER.getHostAndPort()); + mongodbConfig.set(MongoDBSourceOptions.USERNAME, MongoDBContainer.PAIMON_USER); + mongodbConfig.set(MongoDBSourceOptions.PASSWORD, MongoDBContainer.PAIMON_USER_PASSWORD); + mongodbConfig.set(MongoDBSourceOptions.CONNECTION_OPTIONS, "authSource=admin"); + mongodbConfig.set(MongoDBSourceOptions.DATABASE, "invalidDatabase"); + mongodbConfig.set(MongoDBSourceOptions.COLLECTION, "testCollection"); assertThrows( RuntimeException.class, () -> 
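Editor's note: the recurring migration in this commit replaces the deprecated key-typed accessors on Flink's Configuration (setString/getString/getBoolean against an option) with the typed set/get pair, declaring a ConfigOption once where none exists yet. A minimal sketch of that pattern, assuming only flink-core on the classpath; the option key below is made up for illustration.

import org.apache.flink.configuration.ConfigOption;
import org.apache.flink.configuration.ConfigOptions;
import org.apache.flink.configuration.Configuration;

public class TypedConfigOptionSketch {

    // Hypothetical option used only for this example.
    private static final ConfigOption<Boolean> INCLUDE_COMMENTS =
            ConfigOptions.key("example.include-schema-comments")
                    .booleanType()
                    .defaultValue(false);

    public static void main(String[] args) {
        Configuration conf = new Configuration();
        // Typed write instead of conf.setString("example.include-schema-comments", "true").
        conf.set(INCLUDE_COMMENTS, true);
        // Typed read instead of conf.getBoolean("example.include-schema-comments", false).
        boolean includeComments = conf.get(INCLUDE_COMMENTS);
        System.out.println(includeComments); // true
    }
}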
MongodbSchemaUtils.getMongodbSchema(mongodbConfig)); @@ -157,13 +153,12 @@ public void testCreateSchemaFromInvalidDatabase() { @Test public void testCreateSchemaFromInvalidCollection() { Configuration mongodbConfig = new Configuration(); - mongodbConfig.setString(MongoDBSourceOptions.HOSTS, MONGODB_CONTAINER.getHostAndPort()); - mongodbConfig.setString(MongoDBSourceOptions.USERNAME, MongoDBContainer.PAIMON_USER); - mongodbConfig.setString( - MongoDBSourceOptions.PASSWORD, MongoDBContainer.PAIMON_USER_PASSWORD); - mongodbConfig.setString(MongoDBSourceOptions.CONNECTION_OPTIONS, "authSource=admin"); - mongodbConfig.setString(MongoDBSourceOptions.DATABASE, "testDatabase"); - mongodbConfig.setString(MongoDBSourceOptions.COLLECTION, "invalidCollection"); + mongodbConfig.set(MongoDBSourceOptions.HOSTS, MONGODB_CONTAINER.getHostAndPort()); + mongodbConfig.set(MongoDBSourceOptions.USERNAME, MongoDBContainer.PAIMON_USER); + mongodbConfig.set(MongoDBSourceOptions.PASSWORD, MongoDBContainer.PAIMON_USER_PASSWORD); + mongodbConfig.set(MongoDBSourceOptions.CONNECTION_OPTIONS, "authSource=admin"); + mongodbConfig.set(MongoDBSourceOptions.DATABASE, "testDatabase"); + mongodbConfig.set(MongoDBSourceOptions.COLLECTION, "invalidCollection"); assertThrows( RuntimeException.class, () -> MongodbSchemaUtils.getMongodbSchema(mongodbConfig)); diff --git a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/mysql/MySqlSyncTableActionITCase.java b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/mysql/MySqlSyncTableActionITCase.java index bdeab07a746cc..febbe4e1deaad 100644 --- a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/mysql/MySqlSyncTableActionITCase.java +++ b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/mysql/MySqlSyncTableActionITCase.java @@ -31,7 +31,8 @@ import org.apache.paimon.utils.CommonTestUtils; import org.apache.paimon.utils.JsonSerdeUtil; -import org.apache.flink.api.common.restartstrategy.RestartStrategies; +import org.apache.flink.configuration.Configuration; +import org.apache.flink.configuration.RestartStrategyOptions; import org.apache.flink.core.execution.JobClient; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; import org.junit.jupiter.api.BeforeAll; @@ -1285,8 +1286,11 @@ public void testDefaultCheckpointInterval() throws Exception { mySqlConfig.put("database-name", "default_checkpoint"); mySqlConfig.put("table-name", "t"); - StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); - env.setRestartStrategy(RestartStrategies.noRestart()); + // Using `none` to avoid compatibility issues with Flink 1.18-. 
+ Configuration configuration = new Configuration(); + configuration.set(RestartStrategyOptions.RESTART_STRATEGY, "none"); + StreamExecutionEnvironment env = + StreamExecutionEnvironment.getExecutionEnvironment(configuration); MySqlSyncTableAction action = syncTableActionBuilder(mySqlConfig).build(); action.withStreamExecutionEnvironment(env); diff --git a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordSerializeITCase.java b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordSerializeITCase.java index 698900436e8d5..b202ca53c9cc9 100644 --- a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordSerializeITCase.java +++ b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordSerializeITCase.java @@ -25,6 +25,8 @@ import org.apache.paimon.types.VarCharType; import org.apache.flink.api.common.ExecutionConfig; +import org.apache.flink.api.common.serialization.SerializerConfig; +import org.apache.flink.api.common.serialization.SerializerConfigImpl; import org.apache.flink.api.java.typeutils.runtime.kryo.KryoSerializer; import org.apache.flink.core.memory.DataInputView; import org.apache.flink.core.memory.DataOutputView; @@ -35,6 +37,8 @@ import java.io.DataInputStream; import java.io.DataOutputStream; import java.io.IOException; +import java.lang.reflect.Constructor; +import java.lang.reflect.InvocationTargetException; import java.util.ArrayList; import java.util.Collections; import java.util.HashMap; @@ -49,7 +53,7 @@ public class CdcRecordSerializeITCase { @Test - public void testCdcRecordKryoSerialize() throws IOException { + public void testCdcRecordKryoSerialize() throws Exception { KryoSerializer kr = createFlinkKryoSerializer(RichCdcMultiplexRecord.class); RowType.Builder rowType = RowType.builder(); @@ -78,7 +82,7 @@ public void testCdcRecordKryoSerialize() throws IOException { } @Test - public void testUnmodifiableListKryoSerialize() throws IOException { + public void testUnmodifiableListKryoSerialize() throws Exception { KryoSerializer kryoSerializer = createFlinkKryoSerializer(List.class); RowType.Builder rowType = RowType.builder(); rowType.field("id", new BigIntType()); @@ -101,8 +105,24 @@ public void testUnmodifiableListKryoSerialize() throws IOException { assertThat(deserializeRecord).isEqualTo(fields); } - public static KryoSerializer createFlinkKryoSerializer(Class type) { - return new KryoSerializer<>(type, new ExecutionConfig()); + @SuppressWarnings({"unchecked", "rawtypes"}) + public static KryoSerializer createFlinkKryoSerializer(Class type) + throws NoSuchMethodException, InvocationTargetException, InstantiationException, + IllegalAccessException { + try { + Constructor constructor = + KryoSerializer.class.getConstructor(Class.class, SerializerConfig.class); + return (KryoSerializer) constructor.newInstance(type, new SerializerConfigImpl()); + } catch (NoSuchMethodException + | InvocationTargetException + | IllegalAccessException + | InstantiationException e) { + // to stay compatible with Flink 1.18- + } + + Constructor constructor = + KryoSerializer.class.getConstructor(Class.class, ExecutionConfig.class); + return (KryoSerializer) constructor.newInstance(type, new ExecutionConfig()); } private static final class TestOutputView extends DataOutputStream implements DataOutputView { diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/compact/changelog/ChangelogTaskTypeInfo.java 
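Editor's note: same theme for the restart strategy in the test above; instead of the RestartStrategies builder API, the strategy is passed through Configuration before the environment is created. A minimal sketch under that assumption, where "none" disables restarts, matching RestartStrategies.noRestart().

import org.apache.flink.configuration.Configuration;
import org.apache.flink.configuration.RestartStrategyOptions;
import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment;

public class RestartStrategyConfigSketch {

    public static void main(String[] args) {
        Configuration conf = new Configuration();
        // "none" disables restarts, replacing env.setRestartStrategy(RestartStrategies.noRestart()).
        conf.set(RestartStrategyOptions.RESTART_STRATEGY, "none");

        // The configuration is applied when the environment is created.
        StreamExecutionEnvironment env =
                StreamExecutionEnvironment.getExecutionEnvironment(conf);
        System.out.println("environment created with restart strategy 'none', parallelism "
                + env.getParallelism());
    }
}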
b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/compact/changelog/ChangelogTaskTypeInfo.java index 5cae899a07040..a529e6764faea 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/compact/changelog/ChangelogTaskTypeInfo.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/compact/changelog/ChangelogTaskTypeInfo.java @@ -21,6 +21,7 @@ import org.apache.paimon.flink.sink.NoneCopyVersionedSerializerTypeSerializerProxy; import org.apache.flink.api.common.ExecutionConfig; +import org.apache.flink.api.common.serialization.SerializerConfig; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.common.typeutils.TypeSerializer; @@ -56,7 +57,17 @@ public boolean isKeyType() { return false; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public TypeSerializer createSerializer( + SerializerConfig serializerConfig) { + return this.createSerializer((ExecutionConfig) null); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ public TypeSerializer createSerializer(ExecutionConfig config) { // we don't need copy for task return new NoneCopyVersionedSerializerTypeSerializerProxy( diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommittableTypeInfo.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommittableTypeInfo.java index dcb87238b8337..92e826a913792 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommittableTypeInfo.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommittableTypeInfo.java @@ -21,6 +21,7 @@ import org.apache.paimon.table.sink.CommitMessageSerializer; import org.apache.flink.api.common.ExecutionConfig; +import org.apache.flink.api.common.serialization.SerializerConfig; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.common.typeutils.TypeSerializer; @@ -57,7 +58,16 @@ public boolean isKeyType() { return false; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public TypeSerializer createSerializer(SerializerConfig config) { + return this.createSerializer((ExecutionConfig) null); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. 
+ */ public TypeSerializer createSerializer(ExecutionConfig config) { // no copy, so that data from writer is directly going into committer while chaining return new NoneCopyVersionedSerializerTypeSerializerProxy( diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactionTaskTypeInfo.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactionTaskTypeInfo.java index 47defa61a9713..6510a85b800af 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactionTaskTypeInfo.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactionTaskTypeInfo.java @@ -22,6 +22,7 @@ import org.apache.paimon.table.sink.CompactionTaskSerializer; import org.apache.flink.api.common.ExecutionConfig; +import org.apache.flink.api.common.serialization.SerializerConfig; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.common.typeutils.TypeSerializer; @@ -58,7 +59,16 @@ public boolean isKeyType() { return false; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public TypeSerializer createSerializer(SerializerConfig config) { + return this.createSerializer((ExecutionConfig) null); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ public TypeSerializer createSerializer(ExecutionConfig config) { // we don't need copy for task return new NoneCopyVersionedSerializerTypeSerializerProxy( diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java index 59f2f4b1035f0..dd364c196d8bf 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java @@ -42,7 +42,6 @@ import org.apache.flink.streaming.api.datastream.DataStreamSink; import org.apache.flink.streaming.api.datastream.SingleOutputStreamOperator; import org.apache.flink.streaming.api.environment.CheckpointConfig; -import org.apache.flink.streaming.api.environment.ExecutionCheckpointingOptions; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; import org.apache.flink.streaming.api.functions.sink.DiscardingSink; import org.apache.flink.streaming.api.operators.OneInputStreamOperator; @@ -338,13 +337,11 @@ public static void assertStreamingConfiguration(StreamExecutionEnvironment env) checkArgument( !env.getCheckpointConfig().isUnalignedCheckpointsEnabled(), "Paimon sink currently does not support unaligned checkpoints. Please set " - + ExecutionCheckpointingOptions.ENABLE_UNALIGNED.key() - + " to false."); + + "execution.checkpointing.unaligned.enabled to false."); checkArgument( env.getCheckpointConfig().getCheckpointingMode() == CheckpointingMode.EXACTLY_ONCE, "Paimon sink currently only supports EXACTLY_ONCE checkpoint mode. 
Please set " - + ExecutionCheckpointingOptions.CHECKPOINTING_MODE.key() - + " to exactly-once"); + + "execution.checkpointing.mode to exactly-once"); } public static void assertBatchAdaptiveParallelism( diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTableCommittableTypeInfo.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTableCommittableTypeInfo.java index f82f082098671..7da0ae0e20788 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTableCommittableTypeInfo.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTableCommittableTypeInfo.java @@ -21,6 +21,7 @@ import org.apache.paimon.table.sink.CommitMessageSerializer; import org.apache.flink.api.common.ExecutionConfig; +import org.apache.flink.api.common.serialization.SerializerConfig; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.common.typeutils.TypeSerializer; @@ -57,7 +58,16 @@ public boolean isKeyType() { return false; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public TypeSerializer createSerializer(SerializerConfig config) { + return this.createSerializer((ExecutionConfig) null); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ public TypeSerializer createSerializer(ExecutionConfig config) { // no copy, so that data from writer is directly going into committer while chaining return new NoneCopyVersionedSerializerTypeSerializerProxy( diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTableCompactionTaskTypeInfo.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTableCompactionTaskTypeInfo.java index f27f29f87fe74..0116ff198811e 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTableCompactionTaskTypeInfo.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTableCompactionTaskTypeInfo.java @@ -23,6 +23,7 @@ import org.apache.paimon.table.sink.MultiTableCompactionTaskSerializer; import org.apache.flink.api.common.ExecutionConfig; +import org.apache.flink.api.common.serialization.SerializerConfig; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.common.typeutils.TypeSerializer; import org.apache.flink.core.io.SimpleVersionedSerializerTypeSerializerProxy; @@ -60,7 +61,17 @@ public boolean isKeyType() { return false; } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public TypeSerializer createSerializer( + SerializerConfig serializerConfig) { + return this.createSerializer((ExecutionConfig) null); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. 
+ */ public TypeSerializer createSerializer( ExecutionConfig executionConfig) { return new SimpleVersionedSerializerTypeSerializerProxy< diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkSourceBuilder.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkSourceBuilder.java index b3dcd4840cc1b..e864ec0500459 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkSourceBuilder.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FlinkSourceBuilder.java @@ -46,7 +46,6 @@ import org.apache.flink.streaming.api.datastream.DataStream; import org.apache.flink.streaming.api.datastream.DataStreamSource; import org.apache.flink.streaming.api.environment.CheckpointConfig; -import org.apache.flink.streaming.api.environment.ExecutionCheckpointingOptions; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; import org.apache.flink.table.data.RowData; import org.apache.flink.table.data.util.DataFormatConverters; @@ -331,30 +330,25 @@ private void assertStreamingConfigurationForAlignMode(StreamExecutionEnvironment checkArgument( checkpointConfig.isCheckpointingEnabled(), "The align mode of paimon source is only supported when checkpoint enabled. Please set " - + ExecutionCheckpointingOptions.CHECKPOINTING_INTERVAL.key() - + "larger than 0"); + + "execution.checkpointing.interval larger than 0"); checkArgument( checkpointConfig.getMaxConcurrentCheckpoints() == 1, "The align mode of paimon source supports at most one ongoing checkpoint at the same time. Please set " - + ExecutionCheckpointingOptions.MAX_CONCURRENT_CHECKPOINTS.key() - + " to 1"); + + "execution.checkpointing.max-concurrent-checkpoints to 1"); checkArgument( checkpointConfig.getCheckpointTimeout() > conf.get(FlinkConnectorOptions.SOURCE_CHECKPOINT_ALIGN_TIMEOUT) .toMillis(), "The align mode of paimon source requires that the timeout of checkpoint is greater than the timeout of the source's snapshot alignment. Please increase " - + ExecutionCheckpointingOptions.CHECKPOINTING_TIMEOUT.key() - + " or decrease " + + "execution.checkpointing.timeout or decrease " + FlinkConnectorOptions.SOURCE_CHECKPOINT_ALIGN_TIMEOUT.key()); checkArgument( !env.getCheckpointConfig().isUnalignedCheckpointsEnabled(), "The align mode of paimon source currently does not support unaligned checkpoints. Please set " - + ExecutionCheckpointingOptions.ENABLE_UNALIGNED.key() - + " to false."); + + "execution.checkpointing.unaligned.enabled to false."); checkArgument( env.getCheckpointConfig().getCheckpointingMode() == CheckpointingMode.EXACTLY_ONCE, "The align mode of paimon source currently only supports EXACTLY_ONCE checkpoint mode. 
Please set " - + ExecutionCheckpointingOptions.CHECKPOINTING_MODE.key() - + " to exactly-once"); + + "execution.checkpointing.mode to exactly-once"); } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/align/AlignedContinuousFileStoreSource.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/align/AlignedContinuousFileStoreSource.java index d6b7060763acf..705e1d9a7a4c5 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/align/AlignedContinuousFileStoreSource.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/align/AlignedContinuousFileStoreSource.java @@ -73,7 +73,7 @@ public SourceReader createReader(SourceReaderCont limit, new FutureCompletingBlockingQueue<>( context.getConfiguration() - .getInteger(SourceReaderOptions.ELEMENT_QUEUE_CAPACITY))); + .get(SourceReaderOptions.ELEMENT_QUEUE_CAPACITY))); } @Override diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/InternalTypeInfo.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/InternalTypeInfo.java index 4ea5db9f34d48..60898421ddea2 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/InternalTypeInfo.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/InternalTypeInfo.java @@ -22,6 +22,7 @@ import org.apache.paimon.types.RowType; import org.apache.flink.api.common.ExecutionConfig; +import org.apache.flink.api.common.serialization.SerializerConfig; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.common.typeutils.TypeSerializer; @@ -73,8 +74,17 @@ public boolean isKeyType() { return false; } - @Override - public TypeSerializer createSerializer(ExecutionConfig config) { + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + */ + public TypeSerializer createSerializer(SerializerConfig config) { + return this.createSerializer((ExecutionConfig) null); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ + public TypeSerializer createSerializer(ExecutionConfig executionConfig) { return serializer.duplicate(); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/JavaTypeInfo.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/JavaTypeInfo.java index a36243c5bdacb..4aea809b51bc8 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/JavaTypeInfo.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/JavaTypeInfo.java @@ -20,6 +20,7 @@ import org.apache.flink.annotation.PublicEvolving; import org.apache.flink.api.common.ExecutionConfig; +import org.apache.flink.api.common.serialization.SerializerConfig; import org.apache.flink.api.common.typeinfo.AtomicType; import org.apache.flink.api.common.typeinfo.TypeInformation; import org.apache.flink.api.common.typeutils.TypeComparator; @@ -78,7 +79,16 @@ public boolean isKeyType() { return Comparable.class.isAssignableFrom(typeClass); } - @Override + /** + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. 
+ */ + public TypeSerializer createSerializer(SerializerConfig config) { + return this.createSerializer((ExecutionConfig) null); + } + + /** + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + */ public TypeSerializer createSerializer(ExecutionConfig config) { return new JavaSerializer<>(this.typeClass); } @@ -91,7 +101,9 @@ public TypeComparator createComparator( @SuppressWarnings("rawtypes") GenericTypeComparator comparator = new GenericTypeComparator( - sortOrderAscending, createSerializer(executionConfig), this.typeClass); + sortOrderAscending, + new JavaSerializer<>(this.typeClass), + this.typeClass); return (TypeComparator) comparator; } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FileSystemCatalogITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FileSystemCatalogITCase.java index 239043ff79e1d..915c93680a0dc 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FileSystemCatalogITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FileSystemCatalogITCase.java @@ -27,7 +27,6 @@ import org.apache.paimon.fs.Path; import org.apache.paimon.utils.BlockingIterator; -import org.apache.flink.streaming.api.environment.ExecutionCheckpointingOptions; import org.apache.flink.table.api.TableEnvironment; import org.apache.flink.types.Row; import org.apache.flink.util.CloseableIterator; @@ -60,7 +59,7 @@ public void setup() { tableEnvironmentBuilder() .streamingMode() .parallelism(1) - .setConf(ExecutionCheckpointingOptions.ENABLE_UNALIGNED, false) + .setString("execution.checkpointing.unaligned.enabled", "false") .build(); path = getTempDirPath(); tEnv.executeSql( diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkJobRecoveryITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkJobRecoveryITCase.java index c46c4c3589222..8df379a71b786 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkJobRecoveryITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkJobRecoveryITCase.java @@ -65,7 +65,7 @@ public void before() throws IOException { .set( CheckpointingOptions.EXTERNALIZED_CHECKPOINT_RETENTION, ExternalizedCheckpointRetention.RETAIN_ON_CANCELLATION) - .removeConfig(CheckpointingOptions.CHECKPOINTING_INTERVAL); + .removeKey("execution.checkpointing.interval"); // insert source data batchSql("INSERT INTO source_table1 VALUES (1, 'test-1', '20241030')"); @@ -219,10 +219,9 @@ private void testRecoverFromSavepoint( batchSql(sql); } - Configuration config = - sEnv.getConfig() - .getConfiguration() - .set(StateRecoveryOptions.SAVEPOINT_PATH, checkpointPath); + Configuration config = sEnv.getConfig().getConfiguration(); + // use config string to stay compatible with flink 1.19- + config.setString("execution.state-recovery.path", checkpointPath); for (Map.Entry entry : recoverOptions.entrySet()) { config.setString(entry.getKey(), entry.getValue()); } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/RescaleBucketITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/RescaleBucketITCase.java index 08969bddfdb3a..d5747d2e28d4b 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/RescaleBucketITCase.java +++ 
b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/RescaleBucketITCase.java @@ -26,7 +26,6 @@ import org.apache.flink.core.execution.JobClient; import org.apache.flink.core.execution.SavepointFormatType; -import org.apache.flink.runtime.jobgraph.SavepointConfigOptions; import org.apache.flink.types.Row; import org.junit.jupiter.api.Test; @@ -106,9 +105,10 @@ public void testSuspendAndRecoverAfterRescaleOverwrite() throws Exception { assertThat(batchSql("SELECT * FROM T3")).containsExactlyInAnyOrderElementsOf(committedData); // step5: resume streaming job + // use config string to stay compatible with flink 1.19- sEnv.getConfig() .getConfiguration() - .set(SavepointConfigOptions.SAVEPOINT_PATH, savepointPath); + .setString("execution.state-recovery.path", savepointPath); JobClient resumedJobClient = startJobAndCommitSnapshot(streamSql, snapshotAfterRescale.id()); // stop job diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/UnawareBucketAppendOnlyTableITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/UnawareBucketAppendOnlyTableITCase.java index f6dfb1b23046b..6ca78b088fb79 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/UnawareBucketAppendOnlyTableITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/UnawareBucketAppendOnlyTableITCase.java @@ -28,6 +28,7 @@ import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.FileStoreTableFactory; import org.apache.paimon.utils.FailingFileIO; +import org.apache.paimon.utils.TimeUtils; import org.apache.flink.streaming.api.datastream.DataStream; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; @@ -50,7 +51,6 @@ import java.util.List; import java.util.Random; -import static org.apache.flink.streaming.api.environment.ExecutionCheckpointingOptions.CHECKPOINTING_INTERVAL; import static org.assertj.core.api.Assertions.assertThat; import static org.assertj.core.api.Assertions.assertThatThrownBy; @@ -203,7 +203,11 @@ public void testCompactionInStreamingMode() throws Exception { batchSql("ALTER TABLE append_table SET ('compaction.early-max.file-num' = '4')"); batchSql("ALTER TABLE append_table SET ('continuous.discovery-interval' = '1 s')"); - sEnv.getConfig().getConfiguration().set(CHECKPOINTING_INTERVAL, Duration.ofMillis(500)); + sEnv.getConfig() + .getConfiguration() + .setString( + "execution.checkpointing.interval", + TimeUtils.formatWithHighestUnit(Duration.ofMillis(500))); sEnv.executeSql( "CREATE TEMPORARY TABLE Orders_in (\n" + " f0 INT,\n" @@ -224,7 +228,11 @@ public void testCompactionInStreamingModeWithMaxWatermark() throws Exception { batchSql("ALTER TABLE append_table SET ('compaction.early-max.file-num' = '4')"); batchSql("ALTER TABLE append_table SET ('continuous.discovery-interval' = '1 s')"); - sEnv.getConfig().getConfiguration().set(CHECKPOINTING_INTERVAL, Duration.ofMillis(500)); + sEnv.getConfig() + .getConfiguration() + .setString( + "execution.checkpointing.interval", + TimeUtils.formatWithHighestUnit(Duration.ofMillis(500))); sEnv.executeSql( "CREATE TEMPORARY TABLE Orders_in (\n" + " f0 INT,\n" diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/SinkSavepointITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/SinkSavepointITCase.java index 6b912d2e57fe9..b1486deacb0c6 100644 --- 
a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/SinkSavepointITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/SinkSavepointITCase.java @@ -137,7 +137,7 @@ private JobClient runRecoverFromSavepointJob(String failingPath, String savepoin .parallelism(1) .allowRestart() .setConf(conf) - .setConf(StateBackendOptions.STATE_BACKEND, "filesystem") + .setConf(StateBackendOptions.STATE_BACKEND, "hashmap") .setConf( CheckpointingOptions.CHECKPOINTS_DIRECTORY, "file://" + path + "/checkpoint") diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/AbstractTestBase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/AbstractTestBase.java index ce0017eb18747..ee838ed68255e 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/AbstractTestBase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/AbstractTestBase.java @@ -19,6 +19,7 @@ package org.apache.paimon.flink.util; import org.apache.paimon.utils.FileIOUtils; +import org.apache.paimon.utils.TimeUtils; import org.apache.flink.api.common.RuntimeExecutionMode; import org.apache.flink.api.dag.Transformation; @@ -29,7 +30,6 @@ import org.apache.flink.runtime.client.JobStatusMessage; import org.apache.flink.runtime.testutils.MiniClusterResourceConfiguration; import org.apache.flink.streaming.api.CheckpointingMode; -import org.apache.flink.streaming.api.environment.ExecutionCheckpointingOptions; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; import org.apache.flink.table.api.EnvironmentSettings; import org.apache.flink.table.api.TableEnvironment; @@ -164,6 +164,11 @@ public TableEnvironmentBuilder setConf(ConfigOption option, T value) { return this; } + public TableEnvironmentBuilder setString(String key, String value) { + conf.setString(key, value); + return this; + } + public TableEnvironmentBuilder setConf(Configuration conf) { this.conf.addAll(conf); return this; @@ -182,9 +187,10 @@ public TableEnvironment build() { if (checkpointIntervalMs != null) { tEnv.getConfig() .getConfiguration() - .set( - ExecutionCheckpointingOptions.CHECKPOINTING_INTERVAL, - Duration.ofMillis(checkpointIntervalMs)); + .setString( + "execution.checkpointing.interval", + TimeUtils.formatWithHighestUnit( + Duration.ofMillis(checkpointIntervalMs))); } } else { tEnv = diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/ReadWriteTableTestUtil.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/ReadWriteTableTestUtil.java index 86b0014eb39cf..9c3170f9a96b1 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/ReadWriteTableTestUtil.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/ReadWriteTableTestUtil.java @@ -23,8 +23,9 @@ import org.apache.paimon.utils.BlockingIterator; import org.apache.flink.api.common.RuntimeExecutionMode; -import org.apache.flink.api.common.restartstrategy.RestartStrategies; import org.apache.flink.api.common.time.Time; +import org.apache.flink.configuration.Configuration; +import org.apache.flink.configuration.RestartStrategyOptions; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; import org.apache.flink.table.api.EnvironmentSettings; import org.apache.flink.table.api.TableEnvironment; @@ -75,12 +76,11 @@ public static void init(String warehouse) { } 
public static void init(String warehouse, int parallelism) { - StreamExecutionEnvironment sExeEnv = buildStreamEnv(parallelism); - sExeEnv.getConfig().setRestartStrategy(RestartStrategies.noRestart()); + // Using `none` to avoid compatibility issues with Flink 1.18-. + StreamExecutionEnvironment sExeEnv = buildStreamEnv(parallelism, "none"); sEnv = StreamTableEnvironment.create(sExeEnv); - bExeEnv = buildBatchEnv(parallelism); - bExeEnv.getConfig().setRestartStrategy(RestartStrategies.noRestart()); + bExeEnv = buildBatchEnv(parallelism, "none"); bEnv = StreamTableEnvironment.create(bExeEnv, EnvironmentSettings.inBatchMode()); ReadWriteTableTestUtil.warehouse = warehouse; @@ -95,16 +95,24 @@ public static void init(String warehouse, int parallelism) { bEnv.useCatalog(catalog); } - public static StreamExecutionEnvironment buildStreamEnv(int parallelism) { - final StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); + public static StreamExecutionEnvironment buildStreamEnv( + int parallelism, String restartStrategy) { + Configuration configuration = new Configuration(); + configuration.set(RestartStrategyOptions.RESTART_STRATEGY, restartStrategy); + final StreamExecutionEnvironment env = + StreamExecutionEnvironment.getExecutionEnvironment(configuration); env.setRuntimeMode(RuntimeExecutionMode.STREAMING); env.enableCheckpointing(100); env.setParallelism(parallelism); return env; } - public static StreamExecutionEnvironment buildBatchEnv(int parallelism) { - final StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); + public static StreamExecutionEnvironment buildBatchEnv( + int parallelism, String restartStrategy) { + Configuration configuration = new Configuration(); + configuration.set(RestartStrategyOptions.RESTART_STRATEGY, restartStrategy); + final StreamExecutionEnvironment env = + StreamExecutionEnvironment.getExecutionEnvironment(configuration); env.setRuntimeMode(RuntimeExecutionMode.BATCH); env.setParallelism(parallelism); return env; diff --git a/paimon-hive/paimon-hive-connector-common/src/test/java/org/apache/paimon/hive/HiveCatalogITCaseBase.java b/paimon-hive/paimon-hive-connector-common/src/test/java/org/apache/paimon/hive/HiveCatalogITCaseBase.java index 74d2d7e1c3437..2266a8484d9d2 100644 --- a/paimon-hive/paimon-hive-connector-common/src/test/java/org/apache/paimon/hive/HiveCatalogITCaseBase.java +++ b/paimon-hive/paimon-hive-connector-common/src/test/java/org/apache/paimon/hive/HiveCatalogITCaseBase.java @@ -31,12 +31,12 @@ import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.Table; import org.apache.paimon.utils.IOUtils; +import org.apache.paimon.utils.TimeUtils; import com.klarna.hiverunner.HiveShell; import com.klarna.hiverunner.annotations.HiveSQL; import org.apache.flink.core.fs.FSDataInputStream; import org.apache.flink.core.fs.Path; -import org.apache.flink.streaming.api.environment.ExecutionCheckpointingOptions; import org.apache.flink.table.api.EnvironmentSettings; import org.apache.flink.table.api.TableEnvironment; import org.apache.flink.table.api.TableResult; @@ -139,7 +139,9 @@ private void registerHiveCatalog(String catalogName, Map catalog EnvironmentSettings.newInstance().inStreamingMode().build()); sEnv.getConfig() .getConfiguration() - .set(ExecutionCheckpointingOptions.CHECKPOINTING_INTERVAL, Duration.ofSeconds(1)); + .setString( + "execution.checkpointing.interval", + TimeUtils.formatWithHighestUnit(Duration.ofSeconds(1))); 
sEnv.getConfig().set(ExecutionConfigOptions.TABLE_EXEC_RESOURCE_DEFAULT_PARALLELISM, 1); tEnv.executeSql( From a8a3751ab9ad62aba6d6ba93d2e7d2dbc4b532e7 Mon Sep 17 00:00:00 2001 From: Jingsong Date: Tue, 26 Nov 2024 14:57:29 +0800 Subject: [PATCH 063/157] [doc] Fix doc with trino engine --- docs/content/engines/presto.md | 321 ------------------------------- docs/content/engines/trino.md | 61 +++--- docs/content/project/download.md | 10 +- 3 files changed, 27 insertions(+), 365 deletions(-) delete mode 100644 docs/content/engines/presto.md diff --git a/docs/content/engines/presto.md b/docs/content/engines/presto.md deleted file mode 100644 index c336226bcf0a9..0000000000000 --- a/docs/content/engines/presto.md +++ /dev/null @@ -1,321 +0,0 @@ ---- -title: "Presto" -weight: 6 -type: docs -aliases: -- /engines/presto.html ---- - - -# Presto - -This documentation is a guide for using Paimon in Presto. - -## Version - -Paimon currently supports Presto 0.236 and above. - -## Preparing Paimon Jar File - -{{< stable >}} - -Download from master: -https://paimon.apache.org/docs/master/project/download/ - -{{< /stable >}} - -{{< unstable >}} - -| Version | Jar | -|-----------------|-----------------------------------------------------------------------------------------------------------------------------------------------------| -| [0.236, 0.268) | [paimon-presto-0.236-{{< version >}}-plugin.tar.gz](https://repository.apache.org/snapshots/org/apache/paimon/paimon-presto-0.236/{{< version >}}/) | -| [0.268, 0.273) | [paimon-presto-0.268-{{< version >}}-plugin.tar.gz](https://repository.apache.org/snapshots/org/apache/paimon/paimon-presto-0.268/{{< version >}}/) | -| [0.273, latest] | [paimon-presto-0.273-{{< version >}}-plugin.tar.gz](https://repository.apache.org/snapshots/org/apache/paimon/paimon-presto-0.273/{{< version >}}/) | - -{{< /unstable >}} - -You can also manually build a bundled jar from the source code. - -To build from the source code, [clone the git repository]({{< presto_github_repo >}}). - -Build presto connector plugin with the following command. - -``` -mvn clean install -DskipTests -``` - -After the packaging is complete, you can choose the corresponding connector based on your own Presto version: - -| Version | Package | -|-----------------|----------------------------------------------------------------------------------| -| [0.236, 0.268) | `./paimon-presto-0.236/target/paimon-presto-0.236-{{< version >}}-plugin.tar.gz` | -| [0.268, 0.273) | `./paimon-presto-0.268/target/paimon-presto-0.268-{{< version >}}-plugin.tar.gz` | -| [0.273, latest] | `./paimon-presto-0.273/target/paimon-presto-0.273-{{< version >}}-plugin.tar.gz` | - -Of course, we also support different versions of Hive and Hadoop. But note that we utilize -Presto-shaded versions of Hive and Hadoop packages to address dependency conflicts. -You can check the following two links to select the appropriate versions of Hive and Hadoop: - -[hadoop-apache2](https://mvnrepository.com/artifact/com.facebook.presto.hadoop/hadoop-apache2) - -[hive-apache](https://mvnrepository.com/artifact/com.facebook.presto.hive/hive-apache) - -Both Hive 2 and 3, as well as Hadoop 2 and 3, are supported. - -For example, if your presto version is 0.274, hive and hadoop version is 2.x, you could run: - -```bash -mvn clean install -DskipTests -am -pl paimon-presto-0.273 -Dpresto.version=0.274 -Dhadoop.apache2.version=2.7.4-9 -Dhive.apache.version=1.2.2-2 -``` - -## Tmp Dir - -Paimon will unzip some jars to the tmp directory for codegen. 
By default, Presto will use `'/tmp'` as the temporary -directory, but `'/tmp'` may be periodically deleted. - -You can configure this environment variable when Presto starts: -```shell --Djava.io.tmpdir=/path/to/other/tmpdir -``` - -Let Paimon use a secure temporary directory. - -## Configure Paimon Catalog - -### Install Paimon Connector - -```bash -tar -zxf paimon-presto-${PRESTO_VERSION}/target/paimon-presto-${PRESTO_VERSION}-${PAIMON_VERSION}-plugin.tar.gz -C ${PRESTO_HOME}/plugin -``` - -Note that, the variable `PRESTO_VERSION` is module name, must be one of 0.236, 0.268, 0.273. - -### Configuration - -```bash -cd ${PRESTO_HOME} -mkdir -p etc/catalog -``` - -```properties -connector.name=paimon -# set your filesystem path, such as hdfs://namenode01:8020/path and s3://${YOUR_S3_BUCKET}/path -warehouse=${YOUR_FS_PATH} -``` - -If you are using HDFS FileSystem, you will also need to do one more thing: choose one of the following ways to configure your HDFS: - -- set environment variable HADOOP_HOME. -- set environment variable HADOOP_CONF_DIR. -- configure `hadoop-conf-dir` in the properties. - -If you are using S3 FileSystem, you need to add `paimon-s3-${PAIMON_VERSION}.jar` in `${PRESTO_HOME}/plugin/paimon` and additionally configure the following properties in `paimon.properties`: - -```properties -s3.endpoint=${YOUR_ENDPOINTS} -s3.access-key=${YOUR_AK} -s3.secret-key=${YOUR_SK} -``` - -**Query HiveCatalog table:** - -```bash -vim etc/catalog/paimon.properties -``` - -and set the following config: - -```properties -connector.name=paimon -# set your filesystem path, such as hdfs://namenode01:8020/path and s3://${YOUR_S3_BUCKET}/path -warehouse=${YOUR_FS_PATH} -metastore=hive -uri=thrift://${YOUR_HIVE_METASTORE}:9083 -``` - -## Kerberos - -You can configure kerberos keytab file when using KERBEROS authentication in the properties. - -``` -security.kerberos.login.principal=hadoop-user -security.kerberos.login.keytab=/etc/presto/hdfs.keytab -``` - -Keytab files must be distributed to every node in the cluster that runs Presto. - -## Create Schema - -``` -CREATE SCHEMA paimon.test_db; -``` - -## Create Table - -``` -CREATE TABLE paimon.test_db.orders ( - order_key bigint, - order_status varchar, - total_price decimal(18,4), - order_date date -) -WITH ( - file_format = 'ORC', - primary_key = ARRAY['order_key','order_date'], - partitioned_by = ARRAY['order_date'], - bucket = '2', - bucket_key = 'order_key', - changelog_producer = 'input' -) -``` - -## Add Column - -``` -CREATE TABLE paimon.test_db.orders ( - order_key bigint, - orders_tatus varchar, - total_price decimal(18,4), - order_date date -) -WITH ( - file_format = 'ORC', - primary_key = ARRAY['order_key','order_date'], - partitioned_by = ARRAY['order_date'], - bucket = '2', - bucket_key = 'order_key', - changelog_producer = 'input' -) - -ALTER TABLE paimon.test_db.orders ADD COLUMN "shipping_address varchar; -``` - -## Query - -``` -SELECT * FROM paimon.default.MyTable -``` - -## Presto to Paimon type mapping - -This section lists all supported type conversion between Presto and Paimon. -All Presto's data types are available in package ` com.facebook.presto.common.type`. - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
-| Presto Data Type | Paimon Data Type | Atomic Type |
-|---|---|---|
-| RowType | RowType | false |
-| MapType | MapType | false |
-| ArrayType | ArrayType | false |
-| BooleanType | BooleanType | true |
-| TinyintType | TinyIntType | true |
-| SmallintType | SmallIntType | true |
-| IntegerType | IntType | true |
-| BigintType | BigIntType | true |
-| RealType | FloatType | true |
-| DoubleType | DoubleType | true |
-| CharType(length) | CharType(length) | true |
-| VarCharType(VarCharType.MAX_LENGTH) | VarCharType(VarCharType.MAX_LENGTH) | true |
-| VarCharType(length) | VarCharType(length), length is less than VarCharType.MAX_LENGTH | true |
-| DateType | DateType | true |
-| TimestampType | TimestampType | true |
-| DecimalType(precision, scale) | DecimalType(precision, scale) | true |
-| VarBinaryType(length) | VarBinaryType(length) | true |
-| TimestampWithTimeZoneType | LocalZonedTimestampType | true |
diff --git a/docs/content/engines/trino.md b/docs/content/engines/trino.md index 05fc47729d151..bef10f9d2870d 100644 --- a/docs/content/engines/trino.md +++ b/docs/content/engines/trino.md @@ -30,7 +30,7 @@ This documentation is a guide for using Paimon in Trino. ## Version -Paimon currently supports Trino 420 and above. +Paimon currently supports Trino 440. ## Filesystem @@ -40,26 +40,12 @@ filesystems for Trino on Trino official website. ## Preparing Paimon Jar File -{{< stable >}} - -Download from master: -https://paimon.apache.org/docs/master/project/download/ - -{{< /stable >}} - -{{< unstable >}} - -| Version | Package | -|---------------|-----------------------------------------------------------------------------------------------------------------------------------------------| -| [420, 426] | [paimon-trino-420-{{< version >}}-plugin.tar.gz](https://repository.apache.org/snapshots/org/apache/paimon/paimon-trino-420/{{< version >}}/) | -| [427, latest] | [paimon-trino-427-{{< version >}}-plugin.tar.gz](https://repository.apache.org/snapshots/org/apache/paimon/paimon-trino-427/{{< version >}}/) | - -{{< /unstable >}} +[Download]({{< ref "project/download" >}}) You can also manually build a bundled jar from the source code. However, there are a few preliminary steps that need to be taken before compiling: - To build from the source code, [clone the git repository]({{< trino_github_repo >}}). -- Install JDK17 locally, and configure JDK17 as a global environment variable; +- Install JDK21 locally, and configure JDK21 as a global environment variable; Then,you can build bundled jar with the following command: @@ -78,28 +64,17 @@ For example, if you want to use Hadoop 3.3.5-1, you can use the following comman mvn clean install -DskipTests -Dhadoop.apache.version=3.3.5-1 ``` -## Tmp Dir - -Paimon will unzip some jars to the tmp directory for codegen. By default, Trino will use `'/tmp'` as the temporary -directory, but `'/tmp'` may be periodically deleted. - -You can configure this environment variable when Trino starts: -```shell --Djava.io.tmpdir=/path/to/other/tmpdir -``` - -Let Paimon use a secure temporary directory. - ## Configure Paimon Catalog ### Install Paimon Connector ```bash tar -zxf paimon-trino--{{< version >}}-plugin.tar.gz -C ${TRINO_HOME}/plugin ``` -the variable `trino-version` is module name, must be one of 420, 427. -> NOTE: For JDK 17, when Deploying Trino, should add jvm options: `--add-opens=java.base/sun.nio.ch=ALL-UNNAMED --add-opens=java.base/java.nio=ALL-UNNAMED` + +> NOTE: For JDK 21, when Deploying Trino, should add jvm options: `--add-opens=java.base/sun.nio.ch=ALL-UNNAMED --add-opens=java.base/java.nio=ALL-UNNAMED` ### Configure + Catalogs are registered by creating a catalog properties file in the etc/catalog directory. For example, create etc/catalog/paimon.properties with the following contents to mount the paimon connector as the paimon catalog: ``` @@ -186,9 +161,6 @@ SELECT * FROM paimon.test_db.orders ``` ## Query with Time Traveling -{{< tabs "time-travel-example" >}} - -{{< tab "version >=420" >}} ```sql -- read the snapshot from specified timestamp @@ -208,10 +180,15 @@ you have a tag named '1' based on snapshot 2, the statement `SELECT * FROM paimo instead of snapshot 1. {{< /hint >}} -{{< /tab >}} +## Insert +``` +INSERT INTO paimon.test_db.orders VALUES (.....); +``` -{{< /tabs >}} +Supports: +- primary key table with fixed bucket. +- non-primary-key table with bucket -1. 
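As a minimal sketch, assuming an `orders` table with the columns (order_key BIGINT, order_status VARCHAR, total_price DECIMAL(18,4), order_date DATE) used elsewhere in these docs, a concrete insert might look like:

```sql
-- hypothetical values; adjust to your actual table schema
INSERT INTO paimon.test_db.orders
VALUES (1001, 'OPEN', DECIMAL '199.9900', DATE '2024-11-26');
```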
## Trino to Paimon type mapping @@ -319,3 +296,15 @@ All Trino's data types are available in package `io.trino.spi.type`. + +## Tmp Dir + +Paimon will unzip some jars to the tmp directory for codegen. By default, Trino will use `'/tmp'` as the temporary +directory, but `'/tmp'` may be periodically deleted. + +You can configure this environment variable when Trino starts: +```shell +-Djava.io.tmpdir=/path/to/other/tmpdir +``` + +Let Paimon use a secure temporary directory. diff --git a/docs/content/project/download.md b/docs/content/project/download.md index 5e49811076a6b..23d0112b09a2b 100644 --- a/docs/content/project/download.md +++ b/docs/content/project/download.md @@ -49,13 +49,8 @@ This documentation is a guide for downloading Paimon Jars. | Hive 2.3 | [paimon-hive-connector-2.3-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-hive-connector-2.3/{{< version >}}/) | | Hive 2.2 | [paimon-hive-connector-2.2-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-hive-connector-2.2/{{< version >}}/) | | Hive 2.1 | [paimon-hive-connector-2.1-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-hive-connector-2.1/{{< version >}}/) | -| Hive 2.1-cdh-6.3 | [paimon-hive-connector-2.1-cdh-6.3-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-hive-connector-2.1-cdh-6.3/{{< version >}}/) | -| Presto 0.236 | [paimon-presto-0.236-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-presto-0.236/{{< version >}}/) | -| Presto 0.268 | [paimon-presto-0.268-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-presto-0.268/{{< version >}}/) | -| Presto 0.273 | [paimon-presto-0.273-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-presto-0.273/{{< version >}}/) | -| Presto SQL 332 | [paimon-prestosql-332-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-prestosql-332/{{< version >}}/) | -| Trino 420 | [paimon-trino-420-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-trino-420/{{< version >}}/) | -| Trino 427 | [paimon-trino-427-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-trino-427/{{< version >}}/) | +| Hive 2.1-cdh-6.3 | [paimon-hive-connector-2.1-cdh-6.3-{{< version >}}.jar](https://repository.apache.org/snapshots/org/apache/paimon/paimon-hive-connector-2.1-cdh-6.3/{{< version >}}/) | | +| Trino 440 | [paimon-trino-440-{{< version >}}-plugin.tar.gz](https://repository.apache.org/content/repositories/snapshots/org/apache/paimon/paimon-trino-440/{{< version >}}/) | {{< /unstable >}} @@ -79,7 +74,6 @@ This documentation is a guide for downloading Paimon Jars. 
| Hive 2.2 | [paimon-hive-connector-2.2-{{< version >}}.jar](https://repo.maven.apache.org/maven2/org/apache/paimon/paimon-hive-connector-2.2/{{< version >}}/paimon-hive-connector-2.2-{{< version >}}.jar) | | Hive 2.1 | [paimon-hive-connector-2.1-{{< version >}}.jar](https://repo.maven.apache.org/maven2/org/apache/paimon/paimon-hive-connector-2.1/{{< version >}}/paimon-hive-connector-2.1-{{< version >}}.jar) | | Hive 2.1-cdh-6.3 | [paimon-hive-connector-2.1-cdh-6.3-{{< version >}}.jar](https://repo.maven.apache.org/maven2/org/apache/paimon/paimon-hive-connector-2.1-cdh-6.3/{{< version >}}/paimon-hive-connector-2.1-cdh-6.3-{{< version >}}.jar) | -| Presto | [Download from master](https://paimon.apache.org/docs/master/project/download/) | | Trino | [Download from master](https://paimon.apache.org/docs/master/project/download/) | {{< /stable >}} From f822bec3b18f371a58e5d5a0d09421748e5ea3ce Mon Sep 17 00:00:00 2001 From: YeJunHao <41894543+leaves12138@users.noreply.github.com> Date: Tue, 26 Nov 2024 15:47:28 +0800 Subject: [PATCH 064/157] [arrow][parquet] Add parquet field id for arrow schema. (#4582) --- .../org/apache/paimon/arrow/ArrowUtils.java | 121 ++++++++++++++---- .../apache/paimon/arrow/ArrowUtilsTest.java | 96 ++++++++++++++ 2 files changed, 192 insertions(+), 25 deletions(-) create mode 100644 paimon-arrow/src/test/java/org/apache/paimon/arrow/ArrowUtilsTest.java diff --git a/paimon-arrow/src/main/java/org/apache/paimon/arrow/ArrowUtils.java b/paimon-arrow/src/main/java/org/apache/paimon/arrow/ArrowUtils.java index 0cf40ad9faae8..b3925a0a769e1 100644 --- a/paimon-arrow/src/main/java/org/apache/paimon/arrow/ArrowUtils.java +++ b/paimon-arrow/src/main/java/org/apache/paimon/arrow/ArrowUtils.java @@ -22,6 +22,7 @@ import org.apache.paimon.arrow.writer.ArrowFieldWriter; import org.apache.paimon.arrow.writer.ArrowFieldWriterFactoryVisitor; import org.apache.paimon.data.Timestamp; +import org.apache.paimon.table.SpecialFields; import org.apache.paimon.types.ArrayType; import org.apache.paimon.types.DataField; import org.apache.paimon.types.DataType; @@ -48,6 +49,7 @@ import java.io.OutputStream; import java.time.Instant; import java.time.ZoneId; +import java.util.ArrayList; import java.util.Arrays; import java.util.Collections; import java.util.List; @@ -56,6 +58,8 @@ /** Utilities for creating Arrow objects. */ public class ArrowUtils { + static final String PARQUET_FIELD_ID = "PARQUET:field_id"; + public static VectorSchemaRoot createVectorSchemaRoot( RowType rowType, BufferAllocator allocator) { return createVectorSchemaRoot(rowType, allocator, true); @@ -69,7 +73,9 @@ public static VectorSchemaRoot createVectorSchemaRoot( f -> toArrowField( allowUpperCase ? f.name() : f.name().toLowerCase(), - f.type())) + f.id(), + f.type(), + 0)) .collect(Collectors.toList()); return VectorSchemaRoot.create(new Schema(fields), allocator); } @@ -78,40 +84,105 @@ public static FieldVector createVector( DataField dataField, BufferAllocator allocator, boolean allowUpperCase) { return toArrowField( allowUpperCase ? 
dataField.name() : dataField.name().toLowerCase(), - dataField.type()) + dataField.id(), + dataField.type(), + 0) .createVector(allocator); } - public static Field toArrowField(String fieldName, DataType dataType) { + public static Field toArrowField(String fieldName, int fieldId, DataType dataType, int depth) { FieldType fieldType = dataType.accept(ArrowFieldTypeConversion.ARROW_FIELD_TYPE_VISITOR); + fieldType = + new FieldType( + fieldType.isNullable(), + fieldType.getType(), + fieldType.getDictionary(), + Collections.singletonMap(PARQUET_FIELD_ID, String.valueOf(fieldId))); List children = null; if (dataType instanceof ArrayType) { - children = - Collections.singletonList( - toArrowField( - ListVector.DATA_VECTOR_NAME, - ((ArrayType) dataType).getElementType())); + Field field = + toArrowField( + ListVector.DATA_VECTOR_NAME, + fieldId, + ((ArrayType) dataType).getElementType(), + depth + 1); + FieldType typeInner = field.getFieldType(); + field = + new Field( + field.getName(), + new FieldType( + typeInner.isNullable(), + typeInner.getType(), + typeInner.getDictionary(), + Collections.singletonMap( + PARQUET_FIELD_ID, + String.valueOf( + SpecialFields.getArrayElementFieldId( + fieldId, depth + 1)))), + field.getChildren()); + children = Collections.singletonList(field); } else if (dataType instanceof MapType) { MapType mapType = (MapType) dataType; - children = - Collections.singletonList( - new Field( - MapVector.DATA_VECTOR_NAME, - // data vector, key vector and value vector CANNOT be null - new FieldType(false, Types.MinorType.STRUCT.getType(), null), - Arrays.asList( - toArrowField( - MapVector.KEY_NAME, - mapType.getKeyType().notNull()), - toArrowField( - MapVector.VALUE_NAME, - mapType.getValueType().notNull())))); + + Field keyField = + toArrowField( + MapVector.KEY_NAME, fieldId, mapType.getKeyType().notNull(), depth + 1); + FieldType keyType = keyField.getFieldType(); + keyField = + new Field( + keyField.getName(), + new FieldType( + keyType.isNullable(), + keyType.getType(), + keyType.getDictionary(), + Collections.singletonMap( + PARQUET_FIELD_ID, + String.valueOf( + SpecialFields.getMapKeyFieldId( + fieldId, depth + 1)))), + keyField.getChildren()); + + Field valueField = + toArrowField( + MapVector.VALUE_NAME, + fieldId, + mapType.getValueType().notNull(), + depth + 1); + FieldType valueType = valueField.getFieldType(); + valueField = + new Field( + valueField.getName(), + new FieldType( + valueType.isNullable(), + valueType.getType(), + valueType.getDictionary(), + Collections.singletonMap( + PARQUET_FIELD_ID, + String.valueOf( + SpecialFields.getMapValueFieldId( + fieldId, depth + 1)))), + valueField.getChildren()); + + FieldType structType = + new FieldType( + false, + Types.MinorType.STRUCT.getType(), + null, + Collections.singletonMap(PARQUET_FIELD_ID, String.valueOf(fieldId))); + Field mapField = + new Field( + MapVector.DATA_VECTOR_NAME, + // data vector, key vector and value vector CANNOT be null + structType, + Arrays.asList(keyField, valueField)); + + children = Collections.singletonList(mapField); } else if (dataType instanceof RowType) { RowType rowType = (RowType) dataType; - children = - rowType.getFields().stream() - .map(f -> toArrowField(f.name(), f.type())) - .collect(Collectors.toList()); + children = new ArrayList<>(); + for (DataField field : rowType.getFields()) { + children.add(toArrowField(field.name(), field.id(), field.type(), 0)); + } } return new Field(fieldName, fieldType, children); } diff --git 
a/paimon-arrow/src/test/java/org/apache/paimon/arrow/ArrowUtilsTest.java b/paimon-arrow/src/test/java/org/apache/paimon/arrow/ArrowUtilsTest.java new file mode 100644 index 0000000000000..319df13ba10b3 --- /dev/null +++ b/paimon-arrow/src/test/java/org/apache/paimon/arrow/ArrowUtilsTest.java @@ -0,0 +1,96 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.arrow; + +import org.apache.paimon.schema.Schema; +import org.apache.paimon.types.DataTypes; +import org.apache.paimon.types.RowType; + +import org.apache.arrow.memory.RootAllocator; +import org.apache.arrow.vector.types.pojo.Field; +import org.assertj.core.api.Assertions; +import org.junit.jupiter.api.Test; + +import java.util.List; +import java.util.Random; + +/** Test for {@link ArrowUtils}. */ +public class ArrowUtilsTest { + + private static final Random RANDOM = new Random(); + + @Test + public void testParquetFieldId() { + Schema.Builder schemaBuilder = Schema.newBuilder(); + schemaBuilder.column("f0", DataTypes.INT()); + schemaBuilder.column("f1", DataTypes.INT()); + schemaBuilder.column("f2", DataTypes.SMALLINT()); + schemaBuilder.column("f3", DataTypes.STRING()); + schemaBuilder.column("f4", DataTypes.DOUBLE()); + schemaBuilder.column("f5", DataTypes.STRING()); + schemaBuilder.column("F6", DataTypes.STRING()); + schemaBuilder.column("f7", DataTypes.BOOLEAN()); + schemaBuilder.column("f8", DataTypes.DATE()); + schemaBuilder.column("f10", DataTypes.TIMESTAMP(6)); + schemaBuilder.column("f11", DataTypes.DECIMAL(7, 2)); + schemaBuilder.column("f12", DataTypes.BYTES()); + schemaBuilder.column("f13", DataTypes.FLOAT()); + schemaBuilder.column("f14", DataTypes.BINARY(10)); + schemaBuilder.column("f15", DataTypes.VARBINARY(10)); + schemaBuilder.column( + "f16", + DataTypes.ARRAY( + DataTypes.ROW( + DataTypes.FIELD(0, "f0", DataTypes.INT()), + DataTypes.FIELD(1, "f1", DataTypes.SMALLINT()), + DataTypes.FIELD(2, "f2", DataTypes.STRING()), + DataTypes.FIELD(3, "f3", DataTypes.DOUBLE()), + DataTypes.FIELD(4, "f4", DataTypes.BOOLEAN()), + DataTypes.FIELD(5, "f5", DataTypes.DATE()), + DataTypes.FIELD(6, "f6", DataTypes.TIMESTAMP(6)), + DataTypes.FIELD(7, "f7", DataTypes.DECIMAL(7, 2)), + DataTypes.FIELD(8, "f8", DataTypes.BYTES()), + DataTypes.FIELD(9, "f9", DataTypes.FLOAT()), + DataTypes.FIELD(10, "f10", DataTypes.BINARY(10))))); + + RowType rowType = schemaBuilder.build().rowType(); + + List fields = + ArrowUtils.createVectorSchemaRoot(rowType, new RootAllocator()) + .getSchema() + .getFields(); + + for (int i = 0; i < 16; i++) { + Assertions.assertThat( + Integer.parseInt( + fields.get(i).getMetadata().get(ArrowUtils.PARQUET_FIELD_ID))) + .isEqualTo(i); + } + + fields = fields.get(15).getChildren().get(0).getChildren(); + for (int i = 16; i < 26; i++) { + 
Assertions.assertThat( + Integer.parseInt( + fields.get(i - 16) + .getMetadata() + .get(ArrowUtils.PARQUET_FIELD_ID))) + .isEqualTo(i); + } + } +} From 408b78d0dfdd95263436e25a3312b482de714ecd Mon Sep 17 00:00:00 2001 From: Yann Byron Date: Tue, 26 Nov 2024 15:53:06 +0800 Subject: [PATCH 065/157] [spark] adjust paimon spark structure (#4573) --- .github/workflows/utitcase-spark-3.x.yml | 2 +- .github/workflows/utitcase-spark-4.x.yml | 2 +- .github/workflows/utitcase.yml | 2 +- paimon-spark/paimon-spark-3.2/pom.xml | 10 +- paimon-spark/paimon-spark-3.3/pom.xml | 10 +- .../spark/sql/InsertOverwriteTest.scala | 4 +- paimon-spark/paimon-spark-3.4/pom.xml | 10 +- paimon-spark/paimon-spark-3.5/pom.xml | 10 +- paimon-spark/paimon-spark-4.0/pom.xml | 10 +- paimon-spark/paimon-spark-common/pom.xml | 68 ------- ...Row.java => AbstractSparkInternalRow.java} | 103 ++-------- .../apache/paimon/spark/DataConverter.java | 117 ++++++++++++ .../apache/paimon/spark/SparkArrayData.java | 172 ----------------- .../paimon/spark/SparkGenericCatalog.java | 5 +- .../spark/PaimonPartitionManagement.scala | 3 +- .../paimon/spark/PaimonPartitionReader.scala | 1 + .../spark/PaimonPartitionReaderFactory.scala | 7 +- .../paimon/spark/PaimonStatistics.scala | 7 +- .../spark/aggregate/LocalAggregator.scala | 5 +- .../expressions/ExpressionHelper.scala | 11 +- .../MergePaimonScalarSubqueriesBase.scala | 4 +- .../spark/commands/BucketProcessor.scala | 4 +- .../spark/commands/MergeIntoPaimonTable.scala | 13 +- .../commands/UpdatePaimonTableCommand.scala | 7 +- .../paimon/spark/data/SparkArrayData.scala | 118 ++++++++++++ .../paimon/spark/data/SparkInternalRow.scala | 36 ++++ .../PaimonSparkSessionExtensions.scala | 6 +- ...tractPaimonSparkSqlExtensionsParser.scala} | 4 +- .../catalog/PaimonCatalogUtils.scala | 25 +-- .../spark/sql/paimon/ReflectUtils.scala | 43 +++++ .../spark/sql/paimon/shims/SparkShim.scala | 61 ++++++ .../sql/paimon/shims/SparkShimLoader.scala | 43 +++++ paimon-spark/paimon-spark-ut/pom.xml | 180 ++++++++++++++++++ .../spark/SparkCatalogWithHiveTest.java | 0 .../paimon/spark/SparkFileIndexITCase.java | 0 .../spark/SparkFilterConverterTest.java | 0 .../paimon/spark/SparkGenericCatalogTest.java | 0 .../SparkGenericCatalogWithHiveTest.java | 0 .../paimon/spark/SparkInternalRowTest.java | 6 +- .../apache/paimon/spark/SparkReadITCase.java | 0 .../paimon/spark/SparkReadTestBase.java | 0 .../apache/paimon/spark/SparkS3ITCase.java | 0 .../spark/SparkSchemaEvolutionITCase.java | 0 .../paimon/spark/SparkTimeTravelITCase.java | 0 .../SparkTimeTravelWithDataFrameITCase.java | 0 .../apache/paimon/spark/SparkTypeTest.java | 0 .../apache/paimon/spark/SparkWriteITCase.java | 0 .../spark/SparkWriteWithKyroITCase.java | 0 .../extensions/CallStatementParserTest.java | 0 .../org.junit.jupiter.api.extension.Extension | 0 .../src/test/resources/hive-site.xml | 0 .../src/test/resources/log4j2-test.properties | 0 .../paimon/spark/PaimonCDCSourceTest.scala | 0 .../paimon/spark/PaimonCommitTest.scala | 0 .../paimon/spark/PaimonHiveTestBase.scala | 2 +- .../apache/paimon/spark/PaimonSinkTest.scala | 0 .../paimon/spark/PaimonSourceTest.scala | 0 .../paimon/spark/PaimonSparkTestBase.scala | 39 +++- .../apache/paimon/spark/PaimonTableTest.scala | 0 .../apache/paimon/spark/ScanHelperTest.scala | 3 +- .../procedure/AlterBranchProcedureTest.scala | 0 .../spark/procedure/BranchProcedureTest.scala | 0 .../CompactManifestProcedureTest.scala | 0 .../procedure/CompactProcedureTestBase.scala | 0 .../CreateAndDeleteTagProcedureTest.scala | 0 
.../CreateTagFromTimestampProcedureTest.scala | 0 .../ExpirePartitionsProcedureTest.scala | 0 .../ExpireSnapshotsProcedureTest.scala | 0 .../procedure/ExpireTagsProcedureTest.scala | 0 .../procedure/FastForwardProcedureTest.scala | 0 .../MarkPartitionDoneProcedureTest.scala | 0 .../MigrateDatabaseProcedureTest.scala | 0 .../procedure/MigrateFileProcedureTest.scala | 0 .../procedure/MigrateTableProcedureTest.scala | 0 .../spark/procedure/ProcedureTestBase.scala | 0 .../RemoveOrphanFilesProcedureTest.scala | 0 .../procedure/ReplaceTagProcedureTest.scala | 0 .../procedure/RollbackProcedureTest.scala | 0 .../spark/sql/AnalyzeTableTestBase.scala | 14 +- .../spark/sql/BucketedTableQueryTest.scala | 8 +- .../apache/paimon/spark/sql/DDLTestBase.scala | 14 +- .../sql/DDLWithHiveCatalogTestBase.scala | 2 +- .../paimon/spark/sql/DataFrameWriteTest.scala | 0 .../spark/sql/DeleteFromTableTestBase.scala | 0 .../paimon/spark/sql/DeletionVectorTest.scala | 2 +- .../paimon/spark/sql/DescribeTableTest.scala | 0 ...leUnnecessaryPaimonBucketedScanSuite.scala | 6 +- .../spark/sql/DynamicBucketTableTest.scala | 0 .../sql/InsertOverwriteTableTestBase.scala | 4 +- .../spark/sql/LookupCompactionTest.scala | 0 .../sql/MergeIntoNotMatchedBySourceTest.scala | 0 .../spark/sql/MergeIntoTableTestBase.scala | 0 .../paimon/spark/sql/ObjectTableTest.scala | 0 .../PaimonCompositePartitionKeyTestBase.scala | 0 .../paimon/spark/sql/PaimonFunctionTest.scala | 0 .../paimon/spark/sql/PaimonMetricTest.scala | 0 .../sql/PaimonOptimizationTestBase.scala | 35 ++-- .../paimon/spark/sql/PaimonOptionTest.scala | 26 +-- .../sql/PaimonPartitionManagementTest.scala | 0 .../paimon/spark/sql/PaimonPushDownTest.scala | 0 .../paimon/spark/sql/PaimonQueryTest.scala | 2 +- .../spark/sql/PaimonShowColumnsTestBase.scala | 0 .../spark/sql/PaimonSystemTableTest.scala | 0 .../spark/sql/PaimonTagDdlTestBase.scala | 0 .../paimon/spark/sql/PaimonViewTestBase.scala | 0 .../spark/sql/PushDownAggregatesTest.scala | 0 .../spark/sql/SparkVersionSupport.scala | 0 .../spark/sql/TableValuedFunctionsTest.scala | 0 .../spark/sql/UpdateTableTestBase.scala | 0 .../paimon/spark/sql/WithTableOptions.scala | 0 .../org/apache/spark/sql}/paimon/Utils.scala | 12 +- paimon-spark/paimon-spark3-common/pom.xml | 32 +++- ...rg.apache.spark.sql.paimon.shims.SparkShim | 16 ++ .../PaimonSpark3SqlExtensionsParser.scala | 25 +++ .../paimon/spark/data/Spark3ArrayData.scala} | 15 +- .../spark/data/Spark3InternalRow.scala} | 16 +- .../{shims.scala => shims/Spark3Shim.scala} | 54 +++--- paimon-spark/paimon-spark4-common/pom.xml | 51 ++++- ...rg.apache.spark.sql.paimon.shims.SparkShim | 16 ++ .../PaimonSpark4SqlExtensionsParser.scala | 28 +++ .../paimon/spark/data/Spark4ArrayData.scala} | 13 +- .../paimon/spark/data/Spark4InternalRow.scala | 28 +++ .../org/apache/spark/sql/paimon/shims.scala | 86 --------- .../spark/sql/paimon/shims/Spark4Shim.scala | 69 +++++++ paimon-spark/pom.xml | 38 ++-- 125 files changed, 1138 insertions(+), 627 deletions(-) rename paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/{SparkInternalRow.java => AbstractSparkInternalRow.java} (67%) create mode 100644 paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/DataConverter.java delete mode 100644 paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkArrayData.java create mode 100644 paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/data/SparkArrayData.scala create mode 100644 
paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/data/SparkInternalRow.scala rename paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/{PaimonSparkSqlExtensionsParser.scala => AbstractPaimonSparkSqlExtensionsParser.scala} (98%) create mode 100644 paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/ReflectUtils.scala create mode 100644 paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShim.scala create mode 100644 paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShimLoader.scala create mode 100644 paimon-spark/paimon-spark-ut/pom.xml rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkCatalogWithHiveTest.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkFileIndexITCase.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkFilterConverterTest.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkGenericCatalogTest.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkGenericCatalogWithHiveTest.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkInternalRowTest.java (95%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkReadITCase.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkReadTestBase.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkS3ITCase.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkSchemaEvolutionITCase.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkTimeTravelITCase.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkTimeTravelWithDataFrameITCase.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkTypeTest.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkWriteITCase.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/SparkWriteWithKyroITCase.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/java/org/apache/paimon/spark/extensions/CallStatementParserTest.java (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/resources/META-INF/services/org.junit.jupiter.api.extension.Extension (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/resources/hive-site.xml (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/resources/log4j2-test.properties (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/PaimonCDCSourceTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/PaimonCommitTest.scala (100%) rename paimon-spark/{paimon-spark-common => 
paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/PaimonHiveTestBase.scala (98%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/PaimonSinkTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/PaimonSourceTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/PaimonSparkTestBase.scala (79%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/PaimonTableTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/ScanHelperTest.scala (97%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/AlterBranchProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/BranchProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/CompactManifestProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/CompactProcedureTestBase.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/CreateAndDeleteTagProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/CreateTagFromTimestampProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/ExpirePartitionsProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/ExpireSnapshotsProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/ExpireTagsProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/FastForwardProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/MarkPartitionDoneProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/MigrateDatabaseProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/MigrateFileProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/MigrateTableProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/ProcedureTestBase.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/ReplaceTagProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/procedure/RollbackProcedureTest.scala (100%) rename paimon-spark/{paimon-spark-common => 
paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/AnalyzeTableTestBase.scala (97%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/BucketedTableQueryTest.scala (97%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala (97%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala (99%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/DataFrameWriteTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/DeleteFromTableTestBase.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/DeletionVectorTest.scala (99%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/DescribeTableTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/DisableUnnecessaryPaimonBucketedScanSuite.scala (97%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/DynamicBucketTableTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTableTestBase.scala (99%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/LookupCompactionTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/MergeIntoNotMatchedBySourceTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/MergeIntoTableTestBase.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/ObjectTableTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonCompositePartitionKeyTestBase.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonFunctionTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonMetricTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonOptimizationTestBase.scala (90%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonOptionTest.scala (91%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonPartitionManagementTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonQueryTest.scala (99%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonShowColumnsTestBase.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonSystemTableTest.scala (100%) rename paimon-spark/{paimon-spark-common => 
paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonTagDdlTestBase.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTestBase.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/PushDownAggregatesTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/SparkVersionSupport.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/TableValuedFunctionsTest.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/UpdateTableTestBase.scala (100%) rename paimon-spark/{paimon-spark-common => paimon-spark-ut}/src/test/scala/org/apache/paimon/spark/sql/WithTableOptions.scala (100%) rename paimon-spark/{paimon-spark-common/src/test/scala/org/apache/spark => paimon-spark-ut/src/test/scala/org/apache/spark/sql}/paimon/Utils.scala (74%) create mode 100644 paimon-spark/paimon-spark3-common/src/main/resources/META-INF/services/org.apache.spark.sql.paimon.shims.SparkShim create mode 100644 paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/catalyst/parser/extensions/PaimonSpark3SqlExtensionsParser.scala rename paimon-spark/{paimon-spark-3.2/src/test/scala/org/apache/spark/paimon/Utils.scala => paimon-spark3-common/src/main/scala/org/apache/paimon/spark/data/Spark3ArrayData.scala} (73%) rename paimon-spark/{paimon-spark-3.3/src/test/scala/org/apache/spark/paimon/Utils.scala => paimon-spark3-common/src/main/scala/org/apache/paimon/spark/data/Spark3InternalRow.scala} (73%) rename paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/{shims.scala => shims/Spark3Shim.scala} (51%) create mode 100644 paimon-spark/paimon-spark4-common/src/main/resources/META-INF/services/org.apache.spark.sql.paimon.shims.SparkShim create mode 100644 paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/catalyst/parser/extensions/PaimonSpark4SqlExtensionsParser.scala rename paimon-spark/{paimon-spark-3.4/src/test/scala/org/apache/spark/paimon/Utils.scala => paimon-spark4-common/src/main/scala/org/apache/paimon/spark/data/Spark4ArrayData.scala} (72%) create mode 100644 paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/data/Spark4InternalRow.scala delete mode 100644 paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims.scala create mode 100644 paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark4Shim.scala diff --git a/.github/workflows/utitcase-spark-3.x.yml b/.github/workflows/utitcase-spark-3.x.yml index 5edcfe49007ac..2d3df5f4d0053 100644 --- a/.github/workflows/utitcase-spark-3.x.yml +++ b/.github/workflows/utitcase-spark-3.x.yml @@ -54,7 +54,7 @@ jobs: jvm_timezone=$(random_timezone) echo "JVM timezone is set to $jvm_timezone" test_modules="" - for suffix in common_2.12 3.5 3.4 3.3 3.2; do + for suffix in ut 3.5 3.4 3.3 3.2; do test_modules+="org.apache.paimon:paimon-spark-${suffix}," done test_modules="${test_modules%,}" diff --git a/.github/workflows/utitcase-spark-4.x.yml b/.github/workflows/utitcase-spark-4.x.yml index 7fbac23dda4fc..c58fd7c03be27 100644 --- a/.github/workflows/utitcase-spark-4.x.yml +++ b/.github/workflows/utitcase-spark-4.x.yml @@ -54,7 +54,7 @@ jobs: jvm_timezone=$(random_timezone) echo "JVM timezone is set to 
$jvm_timezone" test_modules="" - for suffix in common_2.13 4.0; do + for suffix in ut 4.0; do test_modules+="org.apache.paimon:paimon-spark-${suffix}," done test_modules="${test_modules%,}" diff --git a/.github/workflows/utitcase.yml b/.github/workflows/utitcase.yml index bde67cb4c2039..8aa33f5b8218e 100644 --- a/.github/workflows/utitcase.yml +++ b/.github/workflows/utitcase.yml @@ -54,7 +54,7 @@ jobs: jvm_timezone=$(random_timezone) echo "JVM timezone is set to $jvm_timezone" test_modules="!paimon-e2e-tests," - for suffix in 3.5 3.4 3.3 3.2 common_2.12; do + for suffix in 3.5 3.4 3.3 3.2 ut; do test_modules+="!org.apache.paimon:paimon-spark-${suffix}," done test_modules="${test_modules%,}" diff --git a/paimon-spark/paimon-spark-3.2/pom.xml b/paimon-spark/paimon-spark-3.2/pom.xml index 626bb5bae8330..957319b47dab8 100644 --- a/paimon-spark/paimon-spark-3.2/pom.xml +++ b/paimon-spark/paimon-spark-3.2/pom.xml @@ -36,6 +36,12 @@ under the License. + + org.apache.paimon + paimon-spark3-common + ${project.version} + + org.apache.paimon paimon-spark-common_${scala.binary.version} @@ -63,7 +69,7 @@ under the License. org.apache.paimon - paimon-spark-common_${scala.binary.version} + paimon-spark-ut ${project.version} tests test @@ -126,7 +132,7 @@ under the License. - org.apache.paimon:paimon-spark-common_${scala.binary.version} + org.apache.paimon:paimon-spark3-common diff --git a/paimon-spark/paimon-spark-3.3/pom.xml b/paimon-spark/paimon-spark-3.3/pom.xml index 689e4131ccd9e..0a390d9267894 100644 --- a/paimon-spark/paimon-spark-3.3/pom.xml +++ b/paimon-spark/paimon-spark-3.3/pom.xml @@ -36,6 +36,12 @@ under the License. + + org.apache.paimon + paimon-spark3-common + ${project.version} + + org.apache.paimon paimon-spark-common_${scala.binary.version} @@ -63,7 +69,7 @@ under the License. org.apache.paimon - paimon-spark-common_${scala.binary.version} + paimon-spark-ut ${project.version} tests test @@ -126,7 +132,7 @@ under the License. 
- org.apache.paimon:paimon-spark-common_${scala.binary.version} + org.apache.paimon:paimon-spark3-common diff --git a/paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTest.scala b/paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTest.scala index 304b814b33d38..219d57c865c8c 100644 --- a/paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTest.scala +++ b/paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTest.scala @@ -248,7 +248,7 @@ class InsertOverwriteTest extends PaimonSparkTestBase { spark.sql("SELECT * FROM T ORDER BY a, b"), Row(1, 3, "3") :: Row(2, 4, "4") :: Nil) - withSQLConf("spark.sql.sources.partitionOverwriteMode" -> "dynamic") { + withSparkSQLConf("spark.sql.sources.partitionOverwriteMode" -> "dynamic") { // dynamic overwrite the a=1 partition spark.sql("INSERT OVERWRITE T VALUES (1, 5, '5'), (1, 7, '7')") checkAnswer( @@ -289,7 +289,7 @@ class InsertOverwriteTest extends PaimonSparkTestBase { "ptv2", 22) :: Nil) - withSQLConf("spark.sql.sources.partitionOverwriteMode" -> "dynamic") { + withSparkSQLConf("spark.sql.sources.partitionOverwriteMode" -> "dynamic") { // dynamic overwrite the pt2=22 partition spark.sql( "INSERT OVERWRITE T PARTITION (pt2 = 22) VALUES (3, 'c2', 'ptv1'), (4, 'd2', 'ptv3')") diff --git a/paimon-spark/paimon-spark-3.4/pom.xml b/paimon-spark/paimon-spark-3.4/pom.xml index d1ded508a927c..0f4cb30e4f7f6 100644 --- a/paimon-spark/paimon-spark-3.4/pom.xml +++ b/paimon-spark/paimon-spark-3.4/pom.xml @@ -36,6 +36,12 @@ under the License. + + org.apache.paimon + paimon-spark3-common + ${project.version} + + org.apache.paimon paimon-spark-common_${scala.binary.version} @@ -63,7 +69,7 @@ under the License. org.apache.paimon - paimon-spark-common_${scala.binary.version} + paimon-spark-ut ${project.version} tests test @@ -126,7 +132,7 @@ under the License. - org.apache.paimon:paimon-spark-common_${scala.binary.version} + org.apache.paimon:paimon-spark3-common diff --git a/paimon-spark/paimon-spark-3.5/pom.xml b/paimon-spark/paimon-spark-3.5/pom.xml index 92803cda540e4..1b9c968889083 100644 --- a/paimon-spark/paimon-spark-3.5/pom.xml +++ b/paimon-spark/paimon-spark-3.5/pom.xml @@ -36,6 +36,12 @@ under the License. + + org.apache.paimon + paimon-spark3-common + ${project.version} + + org.apache.paimon paimon-spark-common_${scala.binary.version} @@ -63,7 +69,7 @@ under the License. org.apache.paimon - paimon-spark-common_${scala.binary.version} + paimon-spark-ut ${project.version} tests test @@ -126,7 +132,7 @@ under the License. - org.apache.paimon:paimon-spark-common_${scala.binary.version} + org.apache.paimon:paimon-spark3-common diff --git a/paimon-spark/paimon-spark-4.0/pom.xml b/paimon-spark/paimon-spark-4.0/pom.xml index 9f819f820ce2c..8e7d166dc55b5 100644 --- a/paimon-spark/paimon-spark-4.0/pom.xml +++ b/paimon-spark/paimon-spark-4.0/pom.xml @@ -36,6 +36,12 @@ under the License. + + org.apache.paimon + paimon-spark4-common + ${project.version} + + org.apache.paimon paimon-spark-common_${scala.binary.version} @@ -63,7 +69,7 @@ under the License. org.apache.paimon - paimon-spark-common_${scala.binary.version} + paimon-spark-ut ${project.version} tests test @@ -126,7 +132,7 @@ under the License. 
- org.apache.paimon:paimon-spark-common_${scala.binary.version} + org.apache.paimon:paimon-spark4-common diff --git a/paimon-spark/paimon-spark-common/pom.xml b/paimon-spark/paimon-spark-common/pom.xml index 1cfc53f42d489..052c4c4265fc4 100644 --- a/paimon-spark/paimon-spark-common/pom.xml +++ b/paimon-spark/paimon-spark-common/pom.xml @@ -38,18 +38,6 @@ under the License. - - org.apache.paimon - ${paimon-sparkx-common} - ${project.version} - - - * - * - - - - org.apache.spark spark-sql_${scala.binary.version} @@ -72,46 +60,6 @@ under the License. org.apache.paimon paimon-bundle - - - - - org.apache.spark - spark-sql_${scala.binary.version} - ${spark.version} - tests - test - - - - org.apache.spark - spark-catalyst_${scala.binary.version} - ${spark.version} - tests - test - - - - org.apache.spark - spark-core_${scala.binary.version} - ${spark.version} - tests - test - - - - org.apache.spark - spark-hive_${scala.binary.version} - ${spark.version} - test - - - - org.apache.spark - spark-avro_${scala.binary.version} - ${spark.version} - test - @@ -130,7 +78,6 @@ under the License. org.apache.paimon:paimon-bundle - org.apache.paimon:${paimon-sparkx-common} @@ -155,21 +102,6 @@ under the License. src/main/antlr4 - - - - org.apache.maven.plugins - maven-jar-plugin - - - prepare-test-jar - test-compile - - test-jar - - - - diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkInternalRow.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/AbstractSparkInternalRow.java similarity index 67% rename from paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkInternalRow.java rename to paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/AbstractSparkInternalRow.java index 147c6c2d77c84..28604a6d62933 100644 --- a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkInternalRow.java +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/AbstractSparkInternalRow.java @@ -18,24 +18,15 @@ package org.apache.paimon.spark; -import org.apache.paimon.data.BinaryString; -import org.apache.paimon.data.InternalArray; -import org.apache.paimon.data.InternalMap; import org.apache.paimon.data.InternalRow; -import org.apache.paimon.data.Timestamp; -import org.apache.paimon.spark.util.shim.TypeUtils; +import org.apache.paimon.spark.data.SparkInternalRow; import org.apache.paimon.types.ArrayType; import org.apache.paimon.types.BigIntType; import org.apache.paimon.types.DataType; import org.apache.paimon.types.DataTypeChecks; -import org.apache.paimon.types.IntType; -import org.apache.paimon.types.MapType; -import org.apache.paimon.types.MultisetType; import org.apache.paimon.types.RowType; -import org.apache.spark.sql.catalyst.util.ArrayBasedMapData; import org.apache.spark.sql.catalyst.util.ArrayData; -import org.apache.spark.sql.catalyst.util.DateTimeUtils; import org.apache.spark.sql.catalyst.util.MapData; import org.apache.spark.sql.types.BinaryType; import org.apache.spark.sql.types.BooleanType; @@ -61,19 +52,23 @@ import java.util.Objects; +import static org.apache.paimon.spark.DataConverter.fromPaimon; import static org.apache.paimon.utils.InternalRowUtils.copyInternalRow; -/** Spark {@link org.apache.spark.sql.catalyst.InternalRow} to wrap {@link InternalRow}. */ -public class SparkInternalRow extends org.apache.spark.sql.paimon.shims.InternalRow { +/** + * An abstract {@link SparkInternalRow} that overwrite all the common methods in spark3 and spark4. 
+ */ +public abstract class AbstractSparkInternalRow extends SparkInternalRow { - private final RowType rowType; + protected RowType rowType; - private InternalRow row; + protected InternalRow row; - public SparkInternalRow(RowType rowType) { + public AbstractSparkInternalRow(RowType rowType) { this.rowType = rowType; } + @Override public SparkInternalRow replace(InternalRow row) { this.row = row; return this; @@ -96,7 +91,7 @@ public void update(int i, Object value) { @Override public org.apache.spark.sql.catalyst.InternalRow copy() { - return new SparkInternalRow(rowType).replace(copyInternalRow(row, rowType)); + return SparkInternalRow.create(rowType).replace(copyInternalRow(row, rowType)); } @Override @@ -255,7 +250,7 @@ public boolean equals(Object o) { if (o == null || getClass() != o.getClass()) { return false; } - SparkInternalRow that = (SparkInternalRow) o; + AbstractSparkInternalRow that = (AbstractSparkInternalRow) o; return Objects.equals(rowType, that.rowType) && Objects.equals(row, that.row); } @@ -263,78 +258,4 @@ public boolean equals(Object o) { public int hashCode() { return Objects.hash(rowType, row); } - - // ================== static methods ========================================= - - public static Object fromPaimon(Object o, DataType type) { - if (o == null) { - return null; - } - switch (type.getTypeRoot()) { - case TIMESTAMP_WITHOUT_TIME_ZONE: - case TIMESTAMP_WITH_LOCAL_TIME_ZONE: - return fromPaimon((Timestamp) o); - case CHAR: - case VARCHAR: - return fromPaimon((BinaryString) o); - case DECIMAL: - return fromPaimon((org.apache.paimon.data.Decimal) o); - case ARRAY: - return fromPaimon((InternalArray) o, (ArrayType) type); - case MAP: - case MULTISET: - return fromPaimon((InternalMap) o, type); - case ROW: - return fromPaimon((InternalRow) o, (RowType) type); - default: - return o; - } - } - - public static UTF8String fromPaimon(BinaryString string) { - return UTF8String.fromBytes(string.toBytes()); - } - - public static Decimal fromPaimon(org.apache.paimon.data.Decimal decimal) { - return Decimal.apply(decimal.toBigDecimal()); - } - - public static org.apache.spark.sql.catalyst.InternalRow fromPaimon( - InternalRow row, RowType rowType) { - return new SparkInternalRow(rowType).replace(row); - } - - public static long fromPaimon(Timestamp timestamp) { - if (TypeUtils.treatPaimonTimestampTypeAsSparkTimestampType()) { - return DateTimeUtils.fromJavaTimestamp(timestamp.toSQLTimestamp()); - } else { - return timestamp.toMicros(); - } - } - - public static ArrayData fromPaimon(InternalArray array, ArrayType arrayType) { - return fromPaimonArrayElementType(array, arrayType.getElementType()); - } - - private static ArrayData fromPaimonArrayElementType(InternalArray array, DataType elementType) { - return new SparkArrayData(elementType).replace(array); - } - - public static MapData fromPaimon(InternalMap map, DataType mapType) { - DataType keyType; - DataType valueType; - if (mapType instanceof MapType) { - keyType = ((MapType) mapType).getKeyType(); - valueType = ((MapType) mapType).getValueType(); - } else if (mapType instanceof MultisetType) { - keyType = ((MultisetType) mapType).getElementType(); - valueType = new IntType(); - } else { - throw new UnsupportedOperationException("Unsupported type: " + mapType); - } - - return new ArrayBasedMapData( - fromPaimonArrayElementType(map.keyArray(), keyType), - fromPaimonArrayElementType(map.valueArray(), valueType)); - } } diff --git 
a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/DataConverter.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/DataConverter.java new file mode 100644 index 0000000000000..0b5ea899476eb --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/DataConverter.java @@ -0,0 +1,117 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark; + +import org.apache.paimon.data.BinaryString; +import org.apache.paimon.data.InternalArray; +import org.apache.paimon.data.InternalMap; +import org.apache.paimon.data.InternalRow; +import org.apache.paimon.data.Timestamp; +import org.apache.paimon.spark.data.SparkArrayData; +import org.apache.paimon.spark.data.SparkInternalRow; +import org.apache.paimon.spark.util.shim.TypeUtils; +import org.apache.paimon.types.ArrayType; +import org.apache.paimon.types.DataType; +import org.apache.paimon.types.IntType; +import org.apache.paimon.types.MapType; +import org.apache.paimon.types.MultisetType; +import org.apache.paimon.types.RowType; + +import org.apache.spark.sql.catalyst.util.ArrayBasedMapData; +import org.apache.spark.sql.catalyst.util.ArrayData; +import org.apache.spark.sql.catalyst.util.DateTimeUtils; +import org.apache.spark.sql.catalyst.util.MapData; +import org.apache.spark.sql.types.Decimal; +import org.apache.spark.unsafe.types.UTF8String; + +/** A data converter that convert Paimon data to Spark Data. 
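It hosts the static {@code fromPaimon} conversion helpers that previously lived in {@code SparkInternalRow}, so they can be reused by the version-specific row and array implementations.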
*/ +public class DataConverter { + + public static Object fromPaimon(Object o, DataType type) { + if (o == null) { + return null; + } + switch (type.getTypeRoot()) { + case TIMESTAMP_WITHOUT_TIME_ZONE: + case TIMESTAMP_WITH_LOCAL_TIME_ZONE: + return fromPaimon((Timestamp) o); + case CHAR: + case VARCHAR: + return fromPaimon((BinaryString) o); + case DECIMAL: + return fromPaimon((org.apache.paimon.data.Decimal) o); + case ARRAY: + return fromPaimon((InternalArray) o, (ArrayType) type); + case MAP: + case MULTISET: + return fromPaimon((InternalMap) o, type); + case ROW: + return fromPaimon((InternalRow) o, (RowType) type); + default: + return o; + } + } + + public static UTF8String fromPaimon(BinaryString string) { + return UTF8String.fromBytes(string.toBytes()); + } + + public static Decimal fromPaimon(org.apache.paimon.data.Decimal decimal) { + return Decimal.apply(decimal.toBigDecimal()); + } + + public static org.apache.spark.sql.catalyst.InternalRow fromPaimon( + InternalRow row, RowType rowType) { + return SparkInternalRow.create(rowType).replace(row); + } + + public static long fromPaimon(Timestamp timestamp) { + if (TypeUtils.treatPaimonTimestampTypeAsSparkTimestampType()) { + return DateTimeUtils.fromJavaTimestamp(timestamp.toSQLTimestamp()); + } else { + return timestamp.toMicros(); + } + } + + public static ArrayData fromPaimon(InternalArray array, ArrayType arrayType) { + return fromPaimonArrayElementType(array, arrayType.getElementType()); + } + + private static ArrayData fromPaimonArrayElementType(InternalArray array, DataType elementType) { + return SparkArrayData.create(elementType).replace(array); + } + + public static MapData fromPaimon(InternalMap map, DataType mapType) { + DataType keyType; + DataType valueType; + if (mapType instanceof MapType) { + keyType = ((MapType) mapType).getKeyType(); + valueType = ((MapType) mapType).getValueType(); + } else if (mapType instanceof MultisetType) { + keyType = ((MultisetType) mapType).getElementType(); + valueType = new IntType(); + } else { + throw new UnsupportedOperationException("Unsupported type: " + mapType); + } + + return new ArrayBasedMapData( + fromPaimonArrayElementType(map.keyArray(), keyType), + fromPaimonArrayElementType(map.valueArray(), valueType)); + } +} diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkArrayData.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkArrayData.java deleted file mode 100644 index 9934047a18251..0000000000000 --- a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkArrayData.java +++ /dev/null @@ -1,172 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. 
- */ - -package org.apache.paimon.spark; - -import org.apache.paimon.data.InternalArray; -import org.apache.paimon.types.ArrayType; -import org.apache.paimon.types.BigIntType; -import org.apache.paimon.types.DataType; -import org.apache.paimon.types.DataTypeChecks; -import org.apache.paimon.types.RowType; -import org.apache.paimon.utils.InternalRowUtils; - -import org.apache.spark.sql.catalyst.InternalRow; -import org.apache.spark.sql.catalyst.expressions.SpecializedGettersReader; -import org.apache.spark.sql.catalyst.util.ArrayData; -import org.apache.spark.sql.catalyst.util.MapData; -import org.apache.spark.sql.types.Decimal; -import org.apache.spark.unsafe.types.CalendarInterval; -import org.apache.spark.unsafe.types.UTF8String; - -import static org.apache.paimon.spark.SparkInternalRow.fromPaimon; -import static org.apache.paimon.utils.InternalRowUtils.copyArray; - -/** Spark {@link ArrayData} to wrap Paimon {@link InternalArray}. */ -public class SparkArrayData extends org.apache.spark.sql.paimon.shims.ArrayData { - - private final DataType elementType; - - private InternalArray array; - - public SparkArrayData(DataType elementType) { - this.elementType = elementType; - } - - public SparkArrayData replace(InternalArray array) { - this.array = array; - return this; - } - - @Override - public int numElements() { - return array.size(); - } - - @Override - public ArrayData copy() { - return new SparkArrayData(elementType).replace(copyArray(array, elementType)); - } - - @Override - public Object[] array() { - Object[] objects = new Object[numElements()]; - for (int i = 0; i < objects.length; i++) { - objects[i] = fromPaimon(InternalRowUtils.get(array, i, elementType), elementType); - } - return objects; - } - - @Override - public void setNullAt(int i) { - throw new UnsupportedOperationException(); - } - - @Override - public void update(int i, Object value) { - throw new UnsupportedOperationException(); - } - - @Override - public boolean isNullAt(int ordinal) { - return array.isNullAt(ordinal); - } - - @Override - public boolean getBoolean(int ordinal) { - return array.getBoolean(ordinal); - } - - @Override - public byte getByte(int ordinal) { - return array.getByte(ordinal); - } - - @Override - public short getShort(int ordinal) { - return array.getShort(ordinal); - } - - @Override - public int getInt(int ordinal) { - return array.getInt(ordinal); - } - - @Override - public long getLong(int ordinal) { - if (elementType instanceof BigIntType) { - return array.getLong(ordinal); - } - - return getTimestampMicros(ordinal); - } - - private long getTimestampMicros(int ordinal) { - return fromPaimon(array.getTimestamp(ordinal, DataTypeChecks.getPrecision(elementType))); - } - - @Override - public float getFloat(int ordinal) { - return array.getFloat(ordinal); - } - - @Override - public double getDouble(int ordinal) { - return array.getDouble(ordinal); - } - - @Override - public Decimal getDecimal(int ordinal, int precision, int scale) { - return fromPaimon(array.getDecimal(ordinal, precision, scale)); - } - - @Override - public UTF8String getUTF8String(int ordinal) { - return fromPaimon(array.getString(ordinal)); - } - - @Override - public byte[] getBinary(int ordinal) { - return array.getBinary(ordinal); - } - - @Override - public CalendarInterval getInterval(int ordinal) { - throw new UnsupportedOperationException(); - } - - @Override - public InternalRow getStruct(int ordinal, int numFields) { - return fromPaimon(array.getRow(ordinal, numFields), (RowType) elementType); - } - - @Override - 
public ArrayData getArray(int ordinal) { - return fromPaimon(array.getArray(ordinal), (ArrayType) elementType); - } - - @Override - public MapData getMap(int ordinal) { - return fromPaimon(array.getMap(ordinal), elementType); - } - - @Override - public Object get(int ordinal, org.apache.spark.sql.types.DataType dataType) { - return SpecializedGettersReader.read(this, ordinal, dataType, true, true); - } -} diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkGenericCatalog.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkGenericCatalog.java index d4b712fcb8ee0..9957f0cdf91ff 100644 --- a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkGenericCatalog.java +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkGenericCatalog.java @@ -52,7 +52,7 @@ import org.apache.spark.sql.internal.SQLConf; import org.apache.spark.sql.internal.SessionState; import org.apache.spark.sql.internal.StaticSQLConf; -import org.apache.spark.sql.paimon.shims; +import org.apache.spark.sql.paimon.shims.SparkShimLoader; import org.apache.spark.sql.types.StructType; import org.apache.spark.sql.util.CaseInsensitiveStringMap; import org.slf4j.Logger; @@ -203,7 +203,8 @@ public Table createTable( return sparkCatalog.createTable(ident, schema, partitions, properties); } else { // delegate to the session catalog - return shims.createTable(asTableCatalog(), ident, schema, partitions, properties); + return SparkShimLoader.getSparkShim() + .createTable(asTableCatalog(), ident, schema, partitions, properties); } } diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionManagement.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionManagement.scala index 54970bfe3cb21..9a305ca59a0f1 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionManagement.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionManagement.scala @@ -21,6 +21,7 @@ package org.apache.paimon.spark import org.apache.paimon.CoreOptions import org.apache.paimon.metastore.MetastoreClient import org.apache.paimon.operation.FileStoreCommit +import org.apache.paimon.spark.data.SparkInternalRow import org.apache.paimon.table.FileStoreTable import org.apache.paimon.table.sink.BatchWriteBuilder import org.apache.paimon.types.RowType @@ -116,7 +117,7 @@ trait PaimonPartitionManagement extends SupportsAtomicPartitionManagement { s"the partition schema '${partitionSchema.sql}'." 
) table.newReadBuilder.newScan.listPartitions.asScala - .map(binaryRow => SparkInternalRow.fromPaimon(binaryRow, partitionRowType)) + .map(binaryRow => DataConverter.fromPaimon(binaryRow, partitionRowType)) .filter( sparkInternalRow => { partitionCols.zipWithIndex diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionReader.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionReader.scala index fa9072df31499..526178e28ec33 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionReader.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionReader.scala @@ -20,6 +20,7 @@ package org.apache.paimon.spark import org.apache.paimon.data.{InternalRow => PaimonInternalRow} import org.apache.paimon.reader.RecordReader +import org.apache.paimon.spark.data.SparkInternalRow import org.apache.paimon.spark.schema.PaimonMetadataColumn import org.apache.paimon.table.source.{DataSplit, Split} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionReaderFactory.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionReaderFactory.scala index 94de0bec3b506..59b07a7944811 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionReaderFactory.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionReaderFactory.scala @@ -18,10 +18,11 @@ package org.apache.paimon.spark -import org.apache.paimon.data +import org.apache.paimon.data.{InternalRow => PaimonInternalRow} import org.apache.paimon.disk.IOManager import org.apache.paimon.reader.RecordReader import org.apache.paimon.spark.SparkUtils.createIOManager +import org.apache.paimon.spark.data.SparkInternalRow import org.apache.paimon.spark.schema.PaimonMetadataColumn import org.apache.paimon.table.source.{ReadBuilder, Split} import org.apache.paimon.types.RowType @@ -45,13 +46,13 @@ case class PaimonPartitionReaderFactory( val dataFields = new JList(readBuilder.readType().getFields) dataFields.addAll(metadataColumns.map(_.toPaimonDataField).asJava) val rowType = new RowType(dataFields) - new SparkInternalRow(rowType) + SparkInternalRow.create(rowType) } override def createReader(partition: InputPartition): PartitionReader[InternalRow] = { partition match { case paimonInputPartition: PaimonInputPartition => - val readFunc: Split => RecordReader[data.InternalRow] = + val readFunc: Split => RecordReader[PaimonInternalRow] = (split: Split) => readBuilder.newRead().withIOManager(ioManager).createReader(split) PaimonPartitionReader(readFunc, paimonInputPartition, row, metadataColumns) case _ => diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonStatistics.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonStatistics.scala index 28af4ac0a4fdb..8dd4649330327 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonStatistics.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonStatistics.scala @@ -18,6 +18,7 @@ package org.apache.paimon.spark +import org.apache.paimon.spark.data.SparkInternalRow import org.apache.paimon.stats.ColStats import org.apache.paimon.types.{DataField, DataType, RowType} @@ -118,8 +119,10 @@ object PaimonColumnStats { def apply(dateType: DataType, paimonColStats: 
ColStats[_]): PaimonColumnStats = { PaimonColumnStats( paimonColStats.nullCount, - Optional.ofNullable(SparkInternalRow.fromPaimon(paimonColStats.min().orElse(null), dateType)), - Optional.ofNullable(SparkInternalRow.fromPaimon(paimonColStats.max().orElse(null), dateType)), + Optional.ofNullable( + DataConverter + .fromPaimon(paimonColStats.min().orElse(null), dateType)), + Optional.ofNullable(DataConverter.fromPaimon(paimonColStats.max().orElse(null), dateType)), paimonColStats.distinctCount, paimonColStats.avgLen, paimonColStats.maxLen diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/aggregate/LocalAggregator.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/aggregate/LocalAggregator.scala index cd9718cf44eb2..41e7fd3c3ce90 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/aggregate/LocalAggregator.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/aggregate/LocalAggregator.scala @@ -20,7 +20,8 @@ package org.apache.paimon.spark.aggregate import org.apache.paimon.data.BinaryRow import org.apache.paimon.manifest.PartitionEntry -import org.apache.paimon.spark.{SparkInternalRow, SparkTypeUtils} +import org.apache.paimon.spark.SparkTypeUtils +import org.apache.paimon.spark.data.SparkInternalRow import org.apache.paimon.table.{DataTable, Table} import org.apache.paimon.utils.{InternalRowUtils, ProjectedRow} @@ -104,7 +105,7 @@ class LocalAggregator(table: Table) { ProjectedRow.from(requiredGroupByIndexMapping.toArray).replaceRow(partitionRow) // `ProjectedRow` does not support `hashCode`, so do a deep copy val genericRow = InternalRowUtils.copyInternalRow(projectedRow, partitionType) - new SparkInternalRow(partitionType).replace(genericRow) + SparkInternalRow.create(partitionType).replace(genericRow) } def update(partitionEntry: PartitionEntry): Unit = { diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/expressions/ExpressionHelper.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/expressions/ExpressionHelper.scala index c008819fb0cc8..d4010ea338116 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/expressions/ExpressionHelper.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/expressions/ExpressionHelper.scala @@ -23,12 +23,13 @@ import org.apache.paimon.spark.SparkFilterConverter import org.apache.paimon.spark.catalyst.Compatibility import org.apache.paimon.types.RowType +import org.apache.spark.sql.{Column, SparkSession} import org.apache.spark.sql.PaimonUtils.{normalizeExprs, translateFilter} -import org.apache.spark.sql.SparkSession import org.apache.spark.sql.catalyst.analysis.Resolver import org.apache.spark.sql.catalyst.expressions.{Alias, And, Attribute, Cast, Expression, GetStructField, Literal, PredicateHelper, SubqueryExpression} import org.apache.spark.sql.catalyst.plans.logical.{Filter, LogicalPlan} import org.apache.spark.sql.internal.SQLConf +import org.apache.spark.sql.paimon.shims.SparkShimLoader import org.apache.spark.sql.types.{DataType, NullType} /** An expression helper. 
*/ @@ -36,6 +37,14 @@ trait ExpressionHelper extends PredicateHelper { import ExpressionHelper._ + def toColumn(expr: Expression): Column = { + SparkShimLoader.getSparkShim.column(expr) + } + + def toExpression(spark: SparkSession, col: Column): Expression = { + SparkShimLoader.getSparkShim.convertToExpression(spark, col) + } + protected def resolveExpression( spark: SparkSession)(expr: Expression, plan: LogicalPlan): Expression = { if (expr.resolved) { diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/optimizer/MergePaimonScalarSubqueriesBase.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/optimizer/MergePaimonScalarSubqueriesBase.scala index b0b1a76e7a1f1..3428ed89f0047 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/optimizer/MergePaimonScalarSubqueriesBase.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/optimizer/MergePaimonScalarSubqueriesBase.scala @@ -28,7 +28,7 @@ import org.apache.spark.sql.catalyst.rules.Rule import org.apache.spark.sql.catalyst.trees.TreePattern.{SCALAR_SUBQUERY, SCALAR_SUBQUERY_REFERENCE, TreePattern} import org.apache.spark.sql.execution.datasources.v2.DataSourceV2ScanRelation import org.apache.spark.sql.internal.SQLConf -import org.apache.spark.sql.paimon.shims +import org.apache.spark.sql.paimon.shims.SparkShimLoader import org.apache.spark.sql.types.{DataType, StructType} import scala.collection.mutable.ArrayBuffer @@ -344,7 +344,7 @@ trait MergePaimonScalarSubqueriesBase extends Rule[LogicalPlan] with PredicateHe val Seq(newPlanSupportsHashAggregate, cachedPlanSupportsHashAggregate) = aggregateExpressionsSeq.zip(groupByExpressionSeq).map { case (aggregateExpressions, groupByExpressions) => - shims.Aggregate.supportsHashAggregate( + SparkShimLoader.getSparkShim.supportsHashAggregate( aggregateExpressions.flatMap(_.aggregateFunction.aggBufferAttributes), groupByExpressions) } diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/BucketProcessor.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/BucketProcessor.scala index f252b3bb130b4..57a8a8e4abfd0 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/BucketProcessor.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/BucketProcessor.scala @@ -22,7 +22,7 @@ import org.apache.paimon.crosspartition.{GlobalIndexAssigner, KeyPartOrRow} import org.apache.paimon.data.{BinaryRow, GenericRow, InternalRow => PaimonInternalRow, JoinedRow} import org.apache.paimon.disk.IOManager import org.apache.paimon.index.HashBucketAssigner -import org.apache.paimon.spark.{SparkInternalRow, SparkRow} +import org.apache.paimon.spark.{DataConverter, SparkRow} import org.apache.paimon.spark.SparkUtils.createIOManager import org.apache.paimon.spark.util.EncoderUtils import org.apache.paimon.table.FileStoreTable @@ -179,7 +179,7 @@ class GlobalIndexAssignerIterator( extraRow.setField(1, bucket) queue.enqueue( encoderGroup.internalToRow( - SparkInternalRow.fromPaimon(new JoinedRow(row, extraRow), rowType))) + DataConverter.fromPaimon(new JoinedRow(row, extraRow), rowType))) } ) rowIterator.foreach { diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/MergeIntoPaimonTable.scala 
b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/MergeIntoPaimonTable.scala index f557a0cf38ee0..52e704172fc82 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/MergeIntoPaimonTable.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/MergeIntoPaimonTable.scala @@ -38,7 +38,6 @@ import org.apache.spark.sql.catalyst.expressions.codegen.GeneratePredicate import org.apache.spark.sql.catalyst.plans.logical._ import org.apache.spark.sql.execution.datasources.v2.DataSourceV2Relation import org.apache.spark.sql.functions.{col, lit, monotonically_increasing_id, sum} -import org.apache.spark.sql.paimon.shims.ExpressionUtils.{column, convertToExpression} import org.apache.spark.sql.types.{ByteType, StructField, StructType} import scala.collection.mutable @@ -153,12 +152,12 @@ case class MergeIntoPaimonTable( } if (hasUpdate(matchedActions)) { touchedFilePathsSet ++= findTouchedFiles( - targetDS.join(sourceDS, column(mergeCondition), "inner"), + targetDS.join(sourceDS, toColumn(mergeCondition), "inner"), sparkSession) } if (hasUpdate(notMatchedBySourceActions)) { touchedFilePathsSet ++= findTouchedFiles( - targetDS.join(sourceDS, column(mergeCondition), "left_anti"), + targetDS.join(sourceDS, toColumn(mergeCondition), "left_anti"), sparkSession) } @@ -200,7 +199,7 @@ case class MergeIntoPaimonTable( val sourceDS = createDataset(sparkSession, sourceTable) .withColumn(SOURCE_ROW_COL, lit(true)) - val joinedDS = sourceDS.join(targetDS, column(mergeCondition), "fullOuter") + val joinedDS = sourceDS.join(targetDS, toColumn(mergeCondition), "fullOuter") val joinedPlan = joinedDS.queryExecution.analyzed def resolveOnJoinedPlan(exprs: Seq[Expression]): Seq[Expression] = { @@ -209,9 +208,9 @@ case class MergeIntoPaimonTable( val targetOutput = filteredTargetPlan.output val targetRowNotMatched = resolveOnJoinedPlan( - Seq(convertToExpression(sparkSession, col(SOURCE_ROW_COL).isNull))).head + Seq(toExpression(sparkSession, col(SOURCE_ROW_COL).isNull))).head val sourceRowNotMatched = resolveOnJoinedPlan( - Seq(convertToExpression(sparkSession, col(TARGET_ROW_COL).isNull))).head + Seq(toExpression(sparkSession, col(TARGET_ROW_COL).isNull))).head val matchedExprs = matchedActions.map(_.condition.getOrElse(TrueLiteral)) val notMatchedExprs = notMatchedActions.map(_.condition.getOrElse(TrueLiteral)) val notMatchedBySourceExprs = notMatchedBySourceActions.map(_.condition.getOrElse(TrueLiteral)) @@ -275,7 +274,7 @@ case class MergeIntoPaimonTable( .withColumn(ROW_ID_COL, monotonically_increasing_id()) val sourceDS = createDataset(sparkSession, sourceTable) val count = sourceDS - .join(targetDS, column(mergeCondition), "inner") + .join(targetDS, toColumn(mergeCondition), "inner") .select(col(ROW_ID_COL), lit(1).as("one")) .groupBy(ROW_ID_COL) .agg(sum("one").as("count")) diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/UpdatePaimonTableCommand.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/UpdatePaimonTableCommand.scala index f2ea965d14071..47e3f77d0e2cd 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/UpdatePaimonTableCommand.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/commands/UpdatePaimonTableCommand.scala @@ -33,7 +33,7 @@ import org.apache.spark.sql.catalyst.expressions.Literal.TrueLiteral import 
org.apache.spark.sql.catalyst.plans.logical.{Assignment, Filter, Project, SupportsSubquery} import org.apache.spark.sql.execution.datasources.v2.DataSourceV2Relation import org.apache.spark.sql.functions.lit -import org.apache.spark.sql.paimon.shims.ExpressionUtils.column +import org.apache.spark.sql.paimon.shims.SparkShimLoader case class UpdatePaimonTableCommand( relation: DataSourceV2Relation, @@ -133,7 +133,8 @@ case class UpdatePaimonTableCommand( sparkSession: SparkSession, touchedDataSplits: Array[DataSplit]): Seq[CommitMessage] = { val updateColumns = updateExpressions.zip(relation.output).map { - case (update, origin) => column(update).as(origin.name, origin.metadata) + case (update, origin) => + SparkShimLoader.getSparkShim.column(update).as(origin.name, origin.metadata) } val toUpdateScanRelation = createNewRelation(touchedDataSplits, relation) @@ -156,7 +157,7 @@ case class UpdatePaimonTableCommand( } else { If(condition, update, origin) } - column(updated).as(origin.name, origin.metadata) + SparkShimLoader.getSparkShim.column(updated).as(origin.name, origin.metadata) } val data = createDataset(sparkSession, toUpdateScanRelation).select(updateColumns: _*) diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/data/SparkArrayData.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/data/SparkArrayData.scala new file mode 100644 index 0000000000000..c6539a493cee9 --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/data/SparkArrayData.scala @@ -0,0 +1,118 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.spark.data + +import org.apache.paimon.data.InternalArray +import org.apache.paimon.spark.DataConverter +import org.apache.paimon.types.{ArrayType => PaimonArrayType, BigIntType, DataType => PaimonDataType, DataTypeChecks, RowType} +import org.apache.paimon.utils.InternalRowUtils + +import org.apache.spark.sql.catalyst.InternalRow +import org.apache.spark.sql.catalyst.expressions.SpecializedGettersReader +import org.apache.spark.sql.catalyst.util.{ArrayData, MapData} +import org.apache.spark.sql.paimon.shims.SparkShimLoader +import org.apache.spark.sql.types.{DataType, Decimal} +import org.apache.spark.unsafe.types.{CalendarInterval, UTF8String} + +abstract class SparkArrayData extends org.apache.spark.sql.catalyst.util.ArrayData { + + def replace(array: InternalArray): SparkArrayData +} + +abstract class AbstractSparkArrayData extends SparkArrayData { + + val elementType: PaimonDataType + + var paimonArray: InternalArray = _ + + override def replace(array: InternalArray): SparkArrayData = { + this.paimonArray = array + this + } + + override def numElements(): Int = paimonArray.size() + + override def copy(): ArrayData = { + SparkArrayData.create(elementType).replace(InternalRowUtils.copyArray(paimonArray, elementType)) + } + + override def array: Array[Any] = { + Array.range(0, numElements()).map { + i => + DataConverter + .fromPaimon(InternalRowUtils.get(paimonArray, i, elementType), elementType) + } + } + + override def setNullAt(i: Int): Unit = throw new UnsupportedOperationException() + + override def update(i: Int, value: Any): Unit = throw new UnsupportedOperationException() + + override def isNullAt(ordinal: Int): Boolean = paimonArray.isNullAt(ordinal) + + override def getBoolean(ordinal: Int): Boolean = paimonArray.getBoolean(ordinal) + + override def getByte(ordinal: Int): Byte = paimonArray.getByte(ordinal) + + override def getShort(ordinal: Int): Short = paimonArray.getShort(ordinal) + + override def getInt(ordinal: Int): Int = paimonArray.getInt(ordinal) + + override def getLong(ordinal: Int): Long = elementType match { + case _: BigIntType => paimonArray.getLong(ordinal) + case _ => + DataConverter.fromPaimon( + paimonArray.getTimestamp(ordinal, DataTypeChecks.getPrecision(elementType))) + } + + override def getFloat(ordinal: Int): Float = paimonArray.getFloat(ordinal) + + override def getDouble(ordinal: Int): Double = paimonArray.getDouble(ordinal) + + override def getDecimal(ordinal: Int, precision: Int, scale: Int): Decimal = + DataConverter.fromPaimon(paimonArray.getDecimal(ordinal, precision, scale)) + + override def getUTF8String(ordinal: Int): UTF8String = + DataConverter.fromPaimon(paimonArray.getString(ordinal)) + + override def getBinary(ordinal: Int): Array[Byte] = paimonArray.getBinary(ordinal) + + override def getInterval(ordinal: Int): CalendarInterval = + throw new UnsupportedOperationException() + + override def getStruct(ordinal: Int, numFields: Int): InternalRow = DataConverter + .fromPaimon(paimonArray.getRow(ordinal, numFields), elementType.asInstanceOf[RowType]) + + override def getArray(ordinal: Int): ArrayData = DataConverter.fromPaimon( + paimonArray.getArray(ordinal), + elementType.asInstanceOf[PaimonArrayType]) + + override def getMap(ordinal: Int): MapData = + DataConverter.fromPaimon(paimonArray.getMap(ordinal), elementType) + + override def get(ordinal: Int, dataType: DataType): AnyRef = + SpecializedGettersReader.read(this, ordinal, dataType, true, true) + +} + +object SparkArrayData { + def create(elementType: 
PaimonDataType): SparkArrayData = { + SparkShimLoader.getSparkShim.createSparkArrayData(elementType) + } +} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/data/SparkInternalRow.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/data/SparkInternalRow.scala new file mode 100644 index 0000000000000..f3e607e9d7d20 --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/data/SparkInternalRow.scala @@ -0,0 +1,36 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.data + +import org.apache.paimon.types.RowType + +import org.apache.spark.sql.catalyst.InternalRow +import org.apache.spark.sql.paimon.shims.SparkShimLoader + +abstract class SparkInternalRow extends InternalRow { + def replace(row: org.apache.paimon.data.InternalRow): SparkInternalRow +} + +object SparkInternalRow { + + def create(rowType: RowType): SparkInternalRow = { + SparkShimLoader.getSparkShim.createSparkInternalRow(rowType) + } + +} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala index 6f47a77ef3080..e8f75d394a818 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala @@ -25,14 +25,16 @@ import org.apache.paimon.spark.execution.PaimonStrategy import org.apache.paimon.spark.execution.adaptive.DisableUnnecessaryPaimonBucketedScan import org.apache.spark.sql.SparkSessionExtensions -import org.apache.spark.sql.catalyst.parser.extensions.PaimonSparkSqlExtensionsParser +import org.apache.spark.sql.paimon.shims.SparkShimLoader /** Spark session extension to extends the syntax and adds the rules. 
*/ class PaimonSparkSessionExtensions extends (SparkSessionExtensions => Unit) { override def apply(extensions: SparkSessionExtensions): Unit = { // parser extensions - extensions.injectParser { case (_, parser) => new PaimonSparkSqlExtensionsParser(parser) } + extensions.injectParser { + case (_, parser) => SparkShimLoader.getSparkShim.createSparkParser(parser) + } // analyzer extensions extensions.injectResolutionRule(spark => new PaimonAnalysis(spark)) diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSparkSqlExtensionsParser.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/AbstractPaimonSparkSqlExtensionsParser.scala similarity index 98% rename from paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSparkSqlExtensionsParser.scala rename to paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/AbstractPaimonSparkSqlExtensionsParser.scala index 9ece186930d71..c1d61e9738344 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/PaimonSparkSqlExtensionsParser.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/catalyst/parser/extensions/AbstractPaimonSparkSqlExtensionsParser.scala @@ -47,8 +47,8 @@ import java.util.Locale * @param delegate * The extension parser. */ -class PaimonSparkSqlExtensionsParser(val delegate: ParserInterface) - extends org.apache.spark.sql.paimon.shims.ParserInterface +abstract class AbstractPaimonSparkSqlExtensionsParser(val delegate: ParserInterface) + extends org.apache.spark.sql.catalyst.parser.ParserInterface with Logging { private lazy val substitutor = new VariableSubstitution() diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogUtils.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogUtils.scala index 265c828661952..2ab3dc4945245 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogUtils.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogUtils.scala @@ -23,10 +23,7 @@ import org.apache.spark.SparkConf import org.apache.spark.sql.SparkSession import org.apache.spark.sql.catalyst.catalog.ExternalCatalog import org.apache.spark.sql.internal.StaticSQLConf.CATALOG_IMPLEMENTATION -import org.apache.spark.util.Utils - -import scala.reflect.ClassTag -import scala.util.control.NonFatal +import org.apache.spark.sql.paimon.ReflectUtils object PaimonCatalogUtils { @@ -37,22 +34,10 @@ object PaimonCatalogUtils { } else { "org.apache.spark.sql.catalyst.catalog.InMemoryCatalog" } - reflect[ExternalCatalog, SparkConf, Configuration](externalCatalogClassName, conf, hadoopConf) - } - - private def reflect[T, Arg1 <: AnyRef, Arg2 <: AnyRef]( - className: String, - ctorArg1: Arg1, - ctorArg2: Arg2)(implicit ctorArgTag1: ClassTag[Arg1], ctorArgTag2: ClassTag[Arg2]): T = { - try { - val clazz = Utils.classForName(className) - val ctor = clazz.getDeclaredConstructor(ctorArgTag1.runtimeClass, ctorArgTag2.runtimeClass) - val args = Array[AnyRef](ctorArg1, ctorArg2) - ctor.newInstance(args: _*).asInstanceOf[T] - } catch { - case NonFatal(e) => - throw new IllegalArgumentException(s"Error while instantiating '$className':", e) - } + 
ReflectUtils.reflect[ExternalCatalog, SparkConf, Configuration]( + externalCatalogClassName, + conf, + hadoopConf) } } diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/ReflectUtils.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/ReflectUtils.scala new file mode 100644 index 0000000000000..bedac542ab8bc --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/ReflectUtils.scala @@ -0,0 +1,43 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.spark.sql.paimon + +import org.apache.spark.util.Utils + +import scala.reflect.ClassTag +import scala.util.control.NonFatal + +object ReflectUtils { + + def reflect[T, Arg1 <: AnyRef, Arg2 <: AnyRef](className: String, ctorArg1: Arg1, ctorArg2: Arg2)( + implicit + ctorArgTag1: ClassTag[Arg1], + ctorArgTag2: ClassTag[Arg2]): T = { + try { + val clazz = Utils.classForName(className) + val ctor = clazz.getDeclaredConstructor(ctorArgTag1.runtimeClass, ctorArgTag2.runtimeClass) + val args = Array[AnyRef](ctorArg1, ctorArg2) + ctor.newInstance(args: _*).asInstanceOf[T] + } catch { + case NonFatal(e) => + throw new IllegalArgumentException(s"Error while instantiating '$className':", e) + } + } + +} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShim.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShim.scala new file mode 100644 index 0000000000000..bd85282737e99 --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShim.scala @@ -0,0 +1,61 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.spark.sql.paimon.shims + +import org.apache.paimon.spark.data.{SparkArrayData, SparkInternalRow} +import org.apache.paimon.types.{DataType, RowType} + +import org.apache.spark.sql.{Column, SparkSession} +import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression} +import org.apache.spark.sql.catalyst.parser.ParserInterface +import org.apache.spark.sql.connector.catalog.{Identifier, Table, TableCatalog} +import org.apache.spark.sql.connector.expressions.Transform +import org.apache.spark.sql.types.StructType + +import java.util.{Map => JMap} + +/** + * A spark shim trait. It declare methods which have incompatible implementations between Spark 3 + * and Spark 4. The specific SparkShim implementation will be loaded through Service Provider + * Interface. + */ +trait SparkShim { + + def createSparkParser(delegate: ParserInterface): ParserInterface + + def createSparkInternalRow(rowType: RowType): SparkInternalRow + + def createSparkArrayData(elementType: DataType): SparkArrayData + + def supportsHashAggregate( + aggregateBufferAttributes: Seq[Attribute], + groupingExpression: Seq[Expression]): Boolean + + def createTable( + tableCatalog: TableCatalog, + ident: Identifier, + schema: StructType, + partitions: Array[Transform], + properties: JMap[String, String]): Table + + def column(expr: Expression): Column + + def convertToExpression(spark: SparkSession, column: Column): Expression + +} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShimLoader.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShimLoader.scala new file mode 100644 index 0000000000000..920896547a1e2 --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShimLoader.scala @@ -0,0 +1,43 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.spark.sql.paimon.shims + +import java.util.ServiceLoader + +import scala.collection.JavaConverters._ + +/** Load a [[SparkShim]]'s implementation. 
*/ +object SparkShimLoader { + + private lazy val sparkShim: SparkShim = loadSparkShim() + + def getSparkShim: SparkShim = { + sparkShim + } + + private def loadSparkShim(): SparkShim = { + val shims = ServiceLoader.load(classOf[SparkShim]).asScala + if (shims.isEmpty) { + throw new IllegalStateException("No available spark shim here.") + } else if (shims.size > 1) { + throw new IllegalStateException("Found more than one spark shim here.") + } + shims.head + } +} diff --git a/paimon-spark/paimon-spark-ut/pom.xml b/paimon-spark/paimon-spark-ut/pom.xml new file mode 100644 index 0000000000000..0a18405964875 --- /dev/null +++ b/paimon-spark/paimon-spark-ut/pom.xml @@ -0,0 +1,180 @@ + + + + 4.0.0 + + + org.apache.paimon + paimon-spark + 1.0-SNAPSHOT + + + paimon-spark-ut + Paimon : Spark : UT + + + ${paimon-spark-common.spark.version} + ${paimon.shade.jackson.version} + + + + + org.apache.paimon + ${paimon-sparkx-common} + ${project.version} + test + + + + org.apache.paimon + paimon-spark-common_${scala.binary.version} + ${project.version} + test + + + + org.apache.spark + spark-core_${scala.binary.version} + ${spark.version} + test + + + com.fasterxml.jackson.core + * + + + com.fasterxml.jackson.module + * + + + + + + org.apache.spark + spark-sql_${scala.binary.version} + ${spark.version} + test + + + com.fasterxml.jackson.core + * + + + + + + org.apache.spark + spark-sql_${scala.binary.version} + ${spark.version} + tests + test + + + com.fasterxml.jackson.core + * + + + + + + org.apache.spark + spark-catalyst_${scala.binary.version} + ${spark.version} + tests + test + + + + org.apache.spark + spark-core_${scala.binary.version} + ${spark.version} + tests + test + + + com.fasterxml.jackson.core + * + + + com.fasterxml.jackson.module + * + + + + + + org.apache.spark + spark-hive_${scala.binary.version} + ${spark.version} + test + + + com.fasterxml.jackson.core + * + + + com.google.protobuf + protobuf-java + + + + + + org.apache.spark + spark-avro_${scala.binary.version} + ${spark.version} + test + + + + com.fasterxml.jackson.module + jackson-module-scala_${scala.binary.version} + ${jackson.version} + test + + + + com.google.protobuf + protobuf-java + ${protobuf-java.version} + + + + + + + org.apache.maven.plugins + maven-jar-plugin + + + prepare-test-jar + test-compile + + test-jar + + + + + + + + diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkCatalogWithHiveTest.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkCatalogWithHiveTest.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkCatalogWithHiveTest.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkCatalogWithHiveTest.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkFileIndexITCase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkFileIndexITCase.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkFileIndexITCase.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkFileIndexITCase.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkFilterConverterTest.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkFilterConverterTest.java similarity index 100% rename from 
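Editor's note: SparkShimLoader resolves the single SparkShim implementation through java.util.ServiceLoader, so a Spark-version-specific module only has to ship an implementing class plus a provider-configuration file, and common code never references a concrete shim. The concrete module and class names are not visible in this excerpt, so the names below are assumptions; this is only a sketch of what the registration and a call site could look like.

    // Hypothetical provider-configuration file shipped by a version-specific module:
    //   META-INF/services/org.apache.spark.sql.paimon.shims.SparkShim
    // containing one line with the implementing class name, for example:
    //   org.apache.spark.sql.paimon.shims.Spark3Shim   (illustrative name, not from this patch)

    import org.apache.spark.sql.catalyst.parser.ParserInterface
    import org.apache.spark.sql.paimon.shims.SparkShimLoader

    object ShimUsageSketch {
      // Call sites go through the loader instead of instantiating a parser directly,
      // as PaimonSparkSessionExtensions now does for the SQL extension parser.
      def createExtensionParser(delegate: ParserInterface): ParserInterface =
        SparkShimLoader.getSparkShim.createSparkParser(delegate)
    }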
paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkFilterConverterTest.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkFilterConverterTest.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkGenericCatalogTest.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkGenericCatalogTest.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkGenericCatalogTest.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkGenericCatalogTest.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkGenericCatalogWithHiveTest.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkGenericCatalogWithHiveTest.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkGenericCatalogWithHiveTest.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkGenericCatalogWithHiveTest.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkInternalRowTest.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkInternalRowTest.java similarity index 95% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkInternalRowTest.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkInternalRowTest.java index b98213c0e662b..1117ad58c7376 100644 --- a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkInternalRowTest.java +++ b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkInternalRowTest.java @@ -25,6 +25,7 @@ import org.apache.paimon.data.GenericRow; import org.apache.paimon.data.InternalRow; import org.apache.paimon.data.Timestamp; +import org.apache.paimon.spark.data.SparkInternalRow; import org.apache.paimon.utils.DateTimeUtils; import org.apache.spark.sql.catalyst.CatalystTypeConverters; @@ -95,7 +96,7 @@ public void test() { SparkTypeUtils.fromPaimonType(ALL_TYPES))); org.apache.spark.sql.Row sparkRow = (org.apache.spark.sql.Row) - sparkConverter.apply(new SparkInternalRow(ALL_TYPES).replace(rowData)); + sparkConverter.apply(SparkInternalRow.create(ALL_TYPES).replace(rowData)); String expected = "1," @@ -122,7 +123,8 @@ public void test() { SparkRow sparkRowData = new SparkRow(ALL_TYPES, sparkRow); sparkRow = (org.apache.spark.sql.Row) - sparkConverter.apply(new SparkInternalRow(ALL_TYPES).replace(sparkRowData)); + sparkConverter.apply( + SparkInternalRow.create(ALL_TYPES).replace(sparkRowData)); assertThat(sparkRowToString(sparkRow)).isEqualTo(expected); TimeZone.setDefault(tz); } diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkReadITCase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkReadITCase.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkReadITCase.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkReadITCase.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkReadTestBase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkReadTestBase.java similarity index 100% rename from 
paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkReadTestBase.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkReadTestBase.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkS3ITCase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkS3ITCase.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkS3ITCase.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkS3ITCase.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkSchemaEvolutionITCase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkSchemaEvolutionITCase.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkSchemaEvolutionITCase.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkSchemaEvolutionITCase.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkTimeTravelITCase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkTimeTravelITCase.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkTimeTravelITCase.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkTimeTravelITCase.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkTimeTravelWithDataFrameITCase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkTimeTravelWithDataFrameITCase.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkTimeTravelWithDataFrameITCase.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkTimeTravelWithDataFrameITCase.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkTypeTest.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkTypeTest.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkTypeTest.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkTypeTest.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkWriteITCase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkWriteITCase.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkWriteITCase.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkWriteITCase.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkWriteWithKyroITCase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkWriteWithKyroITCase.java similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/SparkWriteWithKyroITCase.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkWriteWithKyroITCase.java diff --git a/paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/extensions/CallStatementParserTest.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/extensions/CallStatementParserTest.java similarity index 100% 
rename from paimon-spark/paimon-spark-common/src/test/java/org/apache/paimon/spark/extensions/CallStatementParserTest.java rename to paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/extensions/CallStatementParserTest.java diff --git a/paimon-spark/paimon-spark-common/src/test/resources/META-INF/services/org.junit.jupiter.api.extension.Extension b/paimon-spark/paimon-spark-ut/src/test/resources/META-INF/services/org.junit.jupiter.api.extension.Extension similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/resources/META-INF/services/org.junit.jupiter.api.extension.Extension rename to paimon-spark/paimon-spark-ut/src/test/resources/META-INF/services/org.junit.jupiter.api.extension.Extension diff --git a/paimon-spark/paimon-spark-common/src/test/resources/hive-site.xml b/paimon-spark/paimon-spark-ut/src/test/resources/hive-site.xml similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/resources/hive-site.xml rename to paimon-spark/paimon-spark-ut/src/test/resources/hive-site.xml diff --git a/paimon-spark/paimon-spark-common/src/test/resources/log4j2-test.properties b/paimon-spark/paimon-spark-ut/src/test/resources/log4j2-test.properties similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/resources/log4j2-test.properties rename to paimon-spark/paimon-spark-ut/src/test/resources/log4j2-test.properties diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonCDCSourceTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonCDCSourceTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonCDCSourceTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonCDCSourceTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonCommitTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonCommitTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonCommitTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonCommitTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonHiveTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonHiveTestBase.scala similarity index 98% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonHiveTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonHiveTestBase.scala index 842147615d1a7..6d2ffea04df54 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonHiveTestBase.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonHiveTestBase.scala @@ -22,7 +22,7 @@ import org.apache.paimon.hive.TestHiveMetastore import org.apache.hadoop.conf.Configuration import org.apache.spark.SparkConf -import org.apache.spark.paimon.Utils +import org.apache.spark.sql.paimon.Utils import java.io.File diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonSinkTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonSinkTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonSinkTest.scala rename to 
paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonSinkTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonSourceTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonSourceTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonSourceTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonSourceTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonSparkTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonSparkTestBase.scala similarity index 79% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonSparkTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonSparkTestBase.scala index 9b4a344259a93..605b2e6ca5f26 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonSparkTestBase.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonSparkTestBase.scala @@ -25,11 +25,12 @@ import org.apache.paimon.spark.sql.{SparkVersionSupport, WithTableOptions} import org.apache.paimon.table.FileStoreTable import org.apache.spark.SparkConf -import org.apache.spark.paimon.Utils import org.apache.spark.sql.QueryTest import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan import org.apache.spark.sql.connector.catalog.{Identifier => SparkIdentifier} import org.apache.spark.sql.execution.datasources.v2.{DataSourceV2Relation, DataSourceV2ScanRelation} +import org.apache.spark.sql.internal.SQLConf +import org.apache.spark.sql.paimon.Utils import org.apache.spark.sql.test.SharedSparkSession import org.scalactic.source.Position import org.scalatest.Tag @@ -105,7 +106,7 @@ class PaimonSparkTestBase } protected def withTimeZone(timeZone: String)(f: => Unit): Unit = { - withSQLConf("spark.sql.session.timeZone" -> timeZone) { + withSparkSQLConf("spark.sql.session.timeZone" -> timeZone) { val originTimeZone = TimeZone.getDefault try { TimeZone.setDefault(TimeZone.getTimeZone(timeZone)) @@ -116,6 +117,40 @@ class PaimonSparkTestBase } } + // Since SPARK-46227 has changed the definition of withSQLConf that resulted in + // incompatibility between the Spark3.x and Spark4.x, So Paimon declare a separate method + // to provide the same function. 
+ protected def withSparkSQLConf(pairs: (String, String)*)(f: => Unit): Unit = { + withSparkSQLConf0(pairs: _*)(f) + } + + private def withSparkSQLConf0(pairs: (String, String)*)(f: => Unit): Unit = { + val conf = SQLConf.get + val (keys, values) = pairs.unzip + val currentValues = keys.map { + key => + if (conf.contains(key)) { + Some(conf.getConfString(key)) + } else { + None + } + } + (keys, values).zipped.foreach { + (k, v) => + if (SQLConf.isStaticConfigKey(k)) { + throw new RuntimeException(s"Cannot modify the value of a static config: $k") + } + conf.setConfString(k, v) + } + try f + finally { + keys.zip(currentValues).foreach { + case (key, Some(value)) => conf.setConfString(key, value) + case (key, None) => conf.unsetConf(key) + } + } + } + override def test(testName: String, testTags: Tag*)(testFun: => Any)(implicit pos: Position): Unit = { println(testName) diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonTableTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonTableTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/PaimonTableTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/PaimonTableTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/ScanHelperTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/ScanHelperTest.scala similarity index 97% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/ScanHelperTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/ScanHelperTest.scala index fc787246f9f12..a3223446f644b 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/ScanHelperTest.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/ScanHelperTest.scala @@ -26,7 +26,6 @@ import org.apache.paimon.table.source.{DataSplit, Split} import org.junit.jupiter.api.Assertions -import java.util import java.util.{HashMap => JHashMap} import scala.collection.JavaConverters._ @@ -35,7 +34,7 @@ import scala.collection.mutable class ScanHelperTest extends PaimonSparkTestBase { test("Paimon: reshuffle splits") { - withSQLConf(("spark.sql.leafNodeDefaultParallelism", "20")) { + withSparkSQLConf(("spark.sql.leafNodeDefaultParallelism", "20")) { val splitNum = 5 val fileNum = 100 diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/AlterBranchProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/AlterBranchProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/AlterBranchProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/AlterBranchProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/BranchProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/BranchProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/BranchProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/BranchProcedureTest.scala diff --git 
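Editor's note: withSparkSQLConf0 saves the current value of each key, rejects static configs, applies the overrides, runs the body, and then restores or unsets the keys in a finally block, mirroring Spark's own withSQLConf without depending on its Spark-3/Spark-4-specific signature. A short usage sketch under stated assumptions follows; the test class, test name, and query are illustrative, while PaimonSparkTestBase is assumed to provide test, sql, checkAnswer, and the new withSparkSQLConf.

    import org.apache.paimon.spark.PaimonSparkTestBase
    import org.apache.spark.sql.Row

    class WithSparkSQLConfSketch extends PaimonSparkTestBase {
      test("illustrative: conf override is scoped to the block") {
        withSparkSQLConf("spark.sql.ansi.enabled" -> "false") {
          // With ANSI mode disabled, an out-of-bounds array index returns null instead of
          // throwing. The previous conf value (or its unset state) is restored after the
          // block, even if the body throws, thanks to the try/finally above.
          checkAnswer(sql("SELECT array(1, 2)[5]"), Row(null))
        }
      }
    }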
a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/CompactManifestProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CompactManifestProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/CompactManifestProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CompactManifestProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/CompactProcedureTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CompactProcedureTestBase.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/CompactProcedureTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CompactProcedureTestBase.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/CreateAndDeleteTagProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CreateAndDeleteTagProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/CreateAndDeleteTagProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CreateAndDeleteTagProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/CreateTagFromTimestampProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CreateTagFromTimestampProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/CreateTagFromTimestampProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CreateTagFromTimestampProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/ExpirePartitionsProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/ExpirePartitionsProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/ExpirePartitionsProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/ExpirePartitionsProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/ExpireSnapshotsProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/ExpireSnapshotsProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/ExpireSnapshotsProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/ExpireSnapshotsProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/ExpireTagsProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/ExpireTagsProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/ExpireTagsProcedureTest.scala rename to 
paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/ExpireTagsProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/FastForwardProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/FastForwardProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/FastForwardProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/FastForwardProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/MarkPartitionDoneProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/MarkPartitionDoneProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/MarkPartitionDoneProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/MarkPartitionDoneProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/MigrateDatabaseProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/MigrateDatabaseProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/MigrateDatabaseProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/MigrateDatabaseProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/MigrateFileProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/MigrateFileProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/MigrateFileProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/MigrateFileProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/MigrateTableProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/MigrateTableProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/MigrateTableProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/MigrateTableProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/ProcedureTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/ProcedureTestBase.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/ProcedureTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/ProcedureTestBase.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedureTest.scala rename to 
paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/RemoveOrphanFilesProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/ReplaceTagProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/ReplaceTagProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/ReplaceTagProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/ReplaceTagProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/RollbackProcedureTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/RollbackProcedureTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/procedure/RollbackProcedureTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/RollbackProcedureTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/AnalyzeTableTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/AnalyzeTableTestBase.scala similarity index 97% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/AnalyzeTableTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/AnalyzeTableTestBase.scala index 238dd039969a8..4f8ccae22dd55 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/AnalyzeTableTestBase.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/AnalyzeTableTestBase.scala @@ -86,7 +86,7 @@ abstract class AnalyzeTableTestBase extends PaimonSparkTestBase { spark.sql(s"ANALYZE TABLE T COMPUTE STATISTICS") - withSQLConf("spark.paimon.scan.timestamp-millis" -> System.currentTimeMillis.toString) { + withSparkSQLConf("spark.paimon.scan.timestamp-millis" -> System.currentTimeMillis.toString) { checkAnswer( sql("SELECT snapshot_id, schema_id, mergedRecordCount, colstat FROM `T$statistics`"), Row(2, 0, 2, "{ }")) @@ -97,7 +97,7 @@ abstract class AnalyzeTableTestBase extends PaimonSparkTestBase { spark.sql(s"ANALYZE TABLE T COMPUTE STATISTICS") - withSQLConf("spark.paimon.scan.timestamp-millis" -> System.currentTimeMillis.toString) { + withSparkSQLConf("spark.paimon.scan.timestamp-millis" -> System.currentTimeMillis.toString) { checkAnswer( sql("SELECT snapshot_id, schema_id, mergedRecordCount, colstat FROM `T$statistics`"), Row(5, 0, 4, "{ }")) @@ -111,31 +111,31 @@ abstract class AnalyzeTableTestBase extends PaimonSparkTestBase { spark.sql("CALL paimon.sys.create_tag(table => 'test.T', tag => 'test_tag6', snapshot => 6)"), Row(true) :: Nil) - withSQLConf("spark.paimon.scan.tag-name" -> "test_tag5") { + withSparkSQLConf("spark.paimon.scan.tag-name" -> "test_tag5") { checkAnswer( sql("SELECT snapshot_id, schema_id, mergedRecordCount, colstat FROM `T$statistics`"), Row(2, 0, 2, "{ }")) } - withSQLConf("spark.paimon.scan.tag-name" -> "test_tag6") { + withSparkSQLConf("spark.paimon.scan.tag-name" -> "test_tag6") { checkAnswer( sql("SELECT snapshot_id, schema_id, mergedRecordCount, colstat FROM `T$statistics`"), Row(5, 0, 4, "{ }")) } - withSQLConf("spark.paimon.scan.snapshot-id" -> "3") { + withSparkSQLConf("spark.paimon.scan.snapshot-id" -> "3") { checkAnswer( sql("SELECT 
snapshot_id, schema_id, mergedRecordCount, colstat FROM `T$statistics`"), Row(2, 0, 2, "{ }")) } - withSQLConf("spark.paimon.scan.snapshot-id" -> "4") { + withSparkSQLConf("spark.paimon.scan.snapshot-id" -> "4") { checkAnswer( sql("SELECT snapshot_id, schema_id, mergedRecordCount, colstat FROM `T$statistics`"), Row(2, 0, 2, "{ }")) } - withSQLConf("spark.paimon.scan.snapshot-id" -> "6") { + withSparkSQLConf("spark.paimon.scan.snapshot-id" -> "6") { checkAnswer( sql("SELECT snapshot_id, schema_id, mergedRecordCount, colstat FROM `T$statistics`"), Row(5, 0, 4, "{ }")) diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/BucketedTableQueryTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/BucketedTableQueryTest.scala similarity index 97% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/BucketedTableQueryTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/BucketedTableQueryTest.scala index afc70bf9105df..35931924c4875 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/BucketedTableQueryTest.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/BucketedTableQueryTest.scala @@ -29,12 +29,12 @@ class BucketedTableQueryTest extends PaimonSparkTestBase with AdaptiveSparkPlanH private def checkAnswerAndShuffleSorts(query: String, numShuffles: Int, numSorts: Int): Unit = { var expectedResult: Array[Row] = null // avoid config default value change in future, so specify it manually - withSQLConf( + withSparkSQLConf( "spark.sql.sources.v2.bucketing.enabled" -> "false", "spark.sql.autoBroadcastJoinThreshold" -> "-1") { expectedResult = spark.sql(query).collect() } - withSQLConf( + withSparkSQLConf( "spark.sql.sources.v2.bucketing.enabled" -> "true", "spark.sql.autoBroadcastJoinThreshold" -> "-1") { val df = spark.sql(query) @@ -162,10 +162,10 @@ class BucketedTableQueryTest extends PaimonSparkTestBase with AdaptiveSparkPlanH checkAnswerAndShuffleSorts("select max(c) OVER (PARTITION BY id ORDER BY id) from t1", 0, 1) checkAnswerAndShuffleSorts("select sum(id) OVER (PARTITION BY c ORDER BY id) from t1", 1, 1) - withSQLConf("spark.sql.requireAllClusterKeysForDistribution" -> "false") { + withSparkSQLConf("spark.sql.requireAllClusterKeysForDistribution" -> "false") { checkAnswerAndShuffleSorts("SELECT id, c, count(*) FROM t1 GROUP BY id, c", 0, 0) } - withSQLConf("spark.sql.requireAllClusterKeysForDistribution" -> "true") { + withSparkSQLConf("spark.sql.requireAllClusterKeysForDistribution" -> "true") { checkAnswerAndShuffleSorts("SELECT id, c, count(*) FROM t1 GROUP BY id, c", 1, 0) } } diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala similarity index 97% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala index b09a2be98dc8d..6ad5274496a90 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala @@ -238,21 +238,21 @@ abstract class DDLTestBase extends PaimonSparkTestBase { |USING PAIMON |""".stripMargin) - 
withSQLConf("spark.sql.legacy.charVarcharAsString" -> "true") { + withSparkSQLConf("spark.sql.legacy.charVarcharAsString" -> "true") { sql("INSERT INTO paimon_tbl VALUES (1, 'ab')") } - withSQLConf("spark.sql.legacy.charVarcharAsString" -> "false") { + withSparkSQLConf("spark.sql.legacy.charVarcharAsString" -> "false") { sql("INSERT INTO paimon_tbl VALUES (2, 'ab')") } if (gteqSpark3_4) { - withSQLConf("spark.sql.readSideCharPadding" -> "true") { + withSparkSQLConf("spark.sql.readSideCharPadding" -> "true") { checkAnswer( spark.sql("SELECT c FROM paimon_tbl ORDER BY id"), Row("ab ") :: Row("ab ") :: Nil) } - withSQLConf("spark.sql.readSideCharPadding" -> "false") { + withSparkSQLConf("spark.sql.readSideCharPadding" -> "false") { checkAnswer( spark.sql("SELECT c FROM paimon_tbl ORDER BY id"), Row("ab") :: Row("ab ") :: Nil) @@ -270,7 +270,8 @@ abstract class DDLTestBase extends PaimonSparkTestBase { format => Seq(true, false).foreach { datetimeJava8APIEnabled => - withSQLConf("spark.sql.datetime.java8API.enabled" -> datetimeJava8APIEnabled.toString) { + withSparkSQLConf( + "spark.sql.datetime.java8API.enabled" -> datetimeJava8APIEnabled.toString) { withTimeZone("Asia/Shanghai") { withTable("paimon_tbl") { // Spark support create table with timestamp_ntz since 3.4 @@ -430,7 +431,8 @@ abstract class DDLTestBase extends PaimonSparkTestBase { test("Paimon DDL: select table with timestamp and timestamp_ntz with filter") { Seq(true, false).foreach { datetimeJava8APIEnabled => - withSQLConf("spark.sql.datetime.java8API.enabled" -> datetimeJava8APIEnabled.toString) { + withSparkSQLConf( + "spark.sql.datetime.java8API.enabled" -> datetimeJava8APIEnabled.toString) { withTable("paimon_tbl") { // Spark support create table with timestamp_ntz since 3.4 if (gteqSpark3_4) { diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala similarity index 99% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala index 9be8e21a8df2d..e99e4434ef7f1 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala @@ -304,7 +304,7 @@ abstract class DDLWithHiveCatalogTestBase extends PaimonHiveTestBase { withTempDir { tbLocation => withDatabase("paimon_db") { - spark.sql(s"CREATE DATABASE paimon_db") + spark.sql(s"CREATE DATABASE IF NOT EXISTS paimon_db") spark.sql(s"USE paimon_db") withTable("external_tbl", "managed_tbl") { val expertTbLocation = tbLocation.getCanonicalPath diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DataFrameWriteTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DataFrameWriteTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DataFrameWriteTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DataFrameWriteTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DeleteFromTableTestBase.scala 
b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DeleteFromTableTestBase.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DeleteFromTableTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DeleteFromTableTestBase.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DeletionVectorTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DeletionVectorTest.scala similarity index 99% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DeletionVectorTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DeletionVectorTest.scala index e944429e42184..ea8309e14ffef 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DeletionVectorTest.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DeletionVectorTest.scala @@ -25,13 +25,13 @@ import org.apache.paimon.spark.{PaimonSparkTestBase, PaimonSplitScan} import org.apache.paimon.spark.schema.PaimonMetadataColumn import org.apache.paimon.table.FileStoreTable -import org.apache.spark.paimon.Utils import org.apache.spark.sql.Row import org.apache.spark.sql.execution.{QueryExecution, SparkPlan} import org.apache.spark.sql.execution.adaptive.AdaptiveSparkPlanHelper import org.apache.spark.sql.execution.columnar.InMemoryTableScanExec import org.apache.spark.sql.execution.datasources.v2.{BatchScanExec, DataSourceV2Relation} import org.apache.spark.sql.functions.lit +import org.apache.spark.sql.paimon.Utils import org.apache.spark.sql.util.QueryExecutionListener import org.junit.jupiter.api.Assertions diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DescribeTableTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DescribeTableTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DescribeTableTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DescribeTableTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DisableUnnecessaryPaimonBucketedScanSuite.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DisableUnnecessaryPaimonBucketedScanSuite.scala similarity index 97% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DisableUnnecessaryPaimonBucketedScanSuite.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DisableUnnecessaryPaimonBucketedScanSuite.scala index 70339bd7cac3e..f47d40285aa9a 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DisableUnnecessaryPaimonBucketedScanSuite.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DisableUnnecessaryPaimonBucketedScanSuite.scala @@ -48,13 +48,13 @@ class DisableUnnecessaryPaimonBucketedScanSuite assert(bucketedScan.length == expectedNumBucketedScan, query) } - withSQLConf("spark.sql.sources.v2.bucketing.enabled" -> "true") { - withSQLConf("spark.sql.sources.bucketing.autoBucketedScan.enabled" -> "true") { + withSparkSQLConf("spark.sql.sources.v2.bucketing.enabled" -> "true") { + withSparkSQLConf("spark.sql.sources.bucketing.autoBucketedScan.enabled" -> "true") { val df = 
sql(query) val result = df.collect() checkNumBucketedScan(df, expectedNumScanWithAutoScanEnabled) - withSQLConf("spark.sql.sources.bucketing.autoBucketedScan.enabled" -> "false") { + withSparkSQLConf("spark.sql.sources.bucketing.autoBucketedScan.enabled" -> "false") { val expected = sql(query) checkAnswer(expected, result) checkNumBucketedScan(expected, expectedNumScanWithAutoScanDisabled) diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DynamicBucketTableTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DynamicBucketTableTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/DynamicBucketTableTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DynamicBucketTableTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTableTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTableTestBase.scala similarity index 99% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTableTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTableTestBase.scala index 674b45fda68b2..03026e8574295 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTableTestBase.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/InsertOverwriteTableTestBase.scala @@ -346,7 +346,7 @@ abstract class InsertOverwriteTableTestBase extends PaimonSparkTestBase { spark.sql("SELECT * FROM T ORDER BY a, b"), Row(1, 3, "3") :: Row(2, 4, "4") :: Nil) - withSQLConf("spark.sql.sources.partitionOverwriteMode" -> "dynamic") { + withSparkSQLConf("spark.sql.sources.partitionOverwriteMode" -> "dynamic") { // dynamic overwrite the a=1 partition spark.sql("INSERT OVERWRITE T VALUES (1, 5, '5'), (1, 7, '7')") checkAnswer( @@ -387,7 +387,7 @@ abstract class InsertOverwriteTableTestBase extends PaimonSparkTestBase { "ptv2", 22) :: Nil) - withSQLConf("spark.sql.sources.partitionOverwriteMode" -> "dynamic") { + withSparkSQLConf("spark.sql.sources.partitionOverwriteMode" -> "dynamic") { // dynamic overwrite the pt2=22 partition spark.sql( "INSERT OVERWRITE T PARTITION (pt2 = 22) VALUES (3, 'c2', 'ptv1'), (4, 'd2', 'ptv3')") diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/LookupCompactionTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/LookupCompactionTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/LookupCompactionTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/LookupCompactionTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/MergeIntoNotMatchedBySourceTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/MergeIntoNotMatchedBySourceTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/MergeIntoNotMatchedBySourceTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/MergeIntoNotMatchedBySourceTest.scala diff --git 
a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/MergeIntoTableTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/MergeIntoTableTestBase.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/MergeIntoTableTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/MergeIntoTableTestBase.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/ObjectTableTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/ObjectTableTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/ObjectTableTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/ObjectTableTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonCompositePartitionKeyTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonCompositePartitionKeyTestBase.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonCompositePartitionKeyTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonCompositePartitionKeyTestBase.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonFunctionTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonFunctionTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonFunctionTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonFunctionTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonMetricTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonMetricTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonMetricTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonMetricTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonOptimizationTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonOptimizationTestBase.scala similarity index 90% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonOptimizationTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonOptimizationTestBase.scala index 78e8905fa969a..87f4c94486192 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonOptimizationTestBase.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonOptimizationTestBase.scala @@ -20,6 +20,7 @@ package org.apache.paimon.spark.sql import org.apache.paimon.Snapshot.CommitKind import org.apache.paimon.spark.PaimonSparkTestBase +import org.apache.paimon.spark.catalyst.analysis.expressions.ExpressionHelper import org.apache.paimon.spark.catalyst.optimizer.MergePaimonScalarSubqueries import org.apache.spark.sql.Row @@ -27,11 +28,12 @@ import org.apache.spark.sql.catalyst.expressions.{Attribute, CreateNamedStruct, import 
org.apache.spark.sql.catalyst.plans.logical.{CTERelationDef, LogicalPlan, OneRowRelation, WithCTE} import org.apache.spark.sql.catalyst.rules.RuleExecutor import org.apache.spark.sql.functions._ +import org.apache.spark.sql.paimon.Utils import org.junit.jupiter.api.Assertions import scala.collection.immutable -abstract class PaimonOptimizationTestBase extends PaimonSparkTestBase { +abstract class PaimonOptimizationTestBase extends PaimonSparkTestBase with ExpressionHelper { import org.apache.spark.sql.catalyst.dsl.expressions._ import org.apache.spark.sql.catalyst.dsl.plans._ @@ -59,24 +61,25 @@ abstract class PaimonOptimizationTestBase extends PaimonSparkTestBase { |""".stripMargin) val optimizedPlan = Optimize.execute(query.queryExecution.analyzed) - val relation = createRelationV2("T") - val mergedSubquery = relation + val df = Utils.createDataFrame(spark, createRelationV2("T")) + val mergedSubquery = df .select( - count(Literal(1)).as("cnt"), - sum(col("a").expr).as("sum_a"), - avg(col("b").expr).as("avg_b") + toColumn(count(Literal(1))).as("cnt"), + toColumn(sum(toExpression(spark, col("a")))).as("sum_a"), + toColumn(avg(toExpression(spark, col("b"))).as("avg_b")) ) .select( - CreateNamedStruct( - Seq( - Literal("cnt"), - 'cnt, - Literal("sum_a"), - 'sum_a, - Literal("avg_b"), - 'avg_b - )).as("mergedValue")) - val analyzedMergedSubquery = mergedSubquery.analyze + toColumn( + CreateNamedStruct( + Seq( + Literal("cnt"), + 'cnt, + Literal("sum_a"), + 'sum_a, + Literal("avg_b"), + 'avg_b + )).as("mergedValue"))) + val analyzedMergedSubquery = mergedSubquery.queryExecution.analyzed val correctAnswer = WithCTE( OneRowRelation() .select( diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonOptionTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonOptionTest.scala similarity index 91% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonOptionTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonOptionTest.scala index f74d6959b9f16..44df3e54ca724 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonOptionTest.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonOptionTest.scala @@ -29,7 +29,7 @@ class PaimonOptionTest extends PaimonSparkTestBase { import testImplicits._ test("Paimon Option: create table with sql conf") { - withSQLConf("spark.paimon.scan.snapshot-id" -> "2") { + withSparkSQLConf("spark.paimon.scan.snapshot-id" -> "2") { sql("CREATE TABLE T (id INT)") val table = loadTable("T") // check options in schema file directly @@ -39,7 +39,7 @@ class PaimonOptionTest extends PaimonSparkTestBase { } test("Paimon Option: create table by dataframe with sql conf") { - withSQLConf("spark.paimon.scan.snapshot-id" -> "2") { + withSparkSQLConf("spark.paimon.scan.snapshot-id" -> "2") { Seq((1L, "x1"), (2L, "x2")) .toDF("a", "b") .write @@ -61,13 +61,13 @@ class PaimonOptionTest extends PaimonSparkTestBase { val table = loadTable("T") // query with mutable option - withSQLConf("spark.paimon.scan.snapshot-id" -> "1") { + withSparkSQLConf("spark.paimon.scan.snapshot-id" -> "1") { checkAnswer(sql("SELECT * FROM T ORDER BY id"), Row(1)) checkAnswer(spark.read.format("paimon").load(table.location().toString), Row(1)) } // query with immutable option - withSQLConf("spark.paimon.bucket" -> "1") { + withSparkSQLConf("spark.paimon.bucket" -> "1") { 
assertThrows[UnsupportedOperationException] { sql("SELECT * FROM T ORDER BY id") } @@ -85,19 +85,19 @@ class PaimonOptionTest extends PaimonSparkTestBase { val table = loadTable("T") // query with global options - withSQLConf("spark.paimon.scan.snapshot-id" -> "1") { + withSparkSQLConf("spark.paimon.scan.snapshot-id" -> "1") { checkAnswer(sql("SELECT * FROM T ORDER BY id"), Row(1)) checkAnswer(spark.read.format("paimon").load(table.location().toString), Row(1)) } // query with table options - withSQLConf("spark.paimon.*.*.T.scan.snapshot-id" -> "1") { + withSparkSQLConf("spark.paimon.*.*.T.scan.snapshot-id" -> "1") { checkAnswer(sql("SELECT * FROM T ORDER BY id"), Row(1)) checkAnswer(spark.read.format("paimon").load(table.location().toString), Row(1)) } // query with both global and table options - withSQLConf( + withSparkSQLConf( "spark.paimon.scan.snapshot-id" -> "1", "spark.paimon.*.*.T.scan.snapshot-id" -> "2") { checkAnswer(sql("SELECT * FROM T ORDER BY id"), Row(1) :: Row(2) :: Nil) @@ -122,7 +122,7 @@ class PaimonOptionTest extends PaimonSparkTestBase { val table2 = loadTable("T1") // query with global options - withSQLConf("spark.paimon.scan.snapshot-id" -> "1") { + withSparkSQLConf("spark.paimon.scan.snapshot-id" -> "1") { checkAnswer(sql("SELECT * FROM T1 join T2 on T1.id = T2.id ORDER BY T1.id"), Row(1, 1)) checkAnswer( spark.read @@ -134,7 +134,7 @@ class PaimonOptionTest extends PaimonSparkTestBase { } // query with table options - withSQLConf("spark.paimon.*.*.*.scan.snapshot-id" -> "1") { + withSparkSQLConf("spark.paimon.*.*.*.scan.snapshot-id" -> "1") { checkAnswer(sql("SELECT * FROM T1 join T2 on T1.id = T2.id ORDER BY T1.id"), Row(1, 1)) checkAnswer( spark.read @@ -146,7 +146,7 @@ class PaimonOptionTest extends PaimonSparkTestBase { } // query with both global and table options - withSQLConf( + withSparkSQLConf( "spark.paimon.scan.snapshot-id" -> "1", "spark.paimon.*.*.*.scan.snapshot-id" -> "2") { checkAnswer( @@ -161,7 +161,7 @@ class PaimonOptionTest extends PaimonSparkTestBase { ) } - withSQLConf( + withSparkSQLConf( "spark.paimon.*.*.T1.scan.snapshot-id" -> "1", "spark.paimon.*.*.T2.scan.snapshot-id" -> "1") { checkAnswer(sql("SELECT * FROM T1 join T2 on T1.id = T2.id ORDER BY T1.id"), Row(1, 1)) @@ -174,7 +174,7 @@ class PaimonOptionTest extends PaimonSparkTestBase { ) } - withSQLConf( + withSparkSQLConf( "spark.paimon.*.*.T1.scan.snapshot-id" -> "1", "spark.paimon.*.*.T2.scan.snapshot-id" -> "2") { checkAnswer(sql("SELECT * FROM T1 join T2 on T1.id = T2.id ORDER BY T1.id"), Row(1, 1)) @@ -187,7 +187,7 @@ class PaimonOptionTest extends PaimonSparkTestBase { ) } - withSQLConf( + withSparkSQLConf( "spark.paimon.*.*.T1.scan.snapshot-id" -> "2", "spark.paimon.*.*.T2.scan.snapshot-id" -> "2") { checkAnswer( diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonPartitionManagementTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPartitionManagementTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonPartitionManagementTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPartitionManagementTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTest.scala similarity index 100% rename from 
paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonQueryTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonQueryTest.scala similarity index 99% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonQueryTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonQueryTest.scala index beea19c35e925..08f5275f01b50 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonQueryTest.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonQueryTest.scala @@ -281,7 +281,7 @@ class PaimonQueryTest extends PaimonSparkTestBase { // Since Spark 4.0, when `spark.sql.ansi.enabled` is `true` and `array[i]` does not exist, an exception // will be thrown instead of returning null. Here, just disabled it and return null for test. - withSQLConf("spark.sql.ansi.enabled" -> "false") { + withSparkSQLConf("spark.sql.ansi.enabled" -> "false") { checkAnswer( sql(s""" |SELECT diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonShowColumnsTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonShowColumnsTestBase.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonShowColumnsTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonShowColumnsTestBase.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonSystemTableTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonSystemTableTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonSystemTableTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonSystemTableTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonTagDdlTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonTagDdlTestBase.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonTagDdlTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonTagDdlTestBase.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTestBase.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonViewTestBase.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PushDownAggregatesTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PushDownAggregatesTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/PushDownAggregatesTest.scala rename to 
paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PushDownAggregatesTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/SparkVersionSupport.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/SparkVersionSupport.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/SparkVersionSupport.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/SparkVersionSupport.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/TableValuedFunctionsTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/TableValuedFunctionsTest.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/TableValuedFunctionsTest.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/TableValuedFunctionsTest.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/UpdateTableTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/UpdateTableTestBase.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/UpdateTableTestBase.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/UpdateTableTestBase.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/WithTableOptions.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/WithTableOptions.scala similarity index 100% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/paimon/spark/sql/WithTableOptions.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/WithTableOptions.scala diff --git a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/spark/paimon/Utils.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/spark/sql/paimon/Utils.scala similarity index 74% rename from paimon-spark/paimon-spark-common/src/test/scala/org/apache/spark/paimon/Utils.scala rename to paimon-spark/paimon-spark-ut/src/test/scala/org/apache/spark/sql/paimon/Utils.scala index 5ea2dd861e197..03f1c7706efbd 100644 --- a/paimon-spark/paimon-spark-common/src/test/scala/org/apache/spark/paimon/Utils.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/spark/sql/paimon/Utils.scala @@ -16,9 +16,10 @@ * limitations under the License. 
*/ -package org.apache.spark.paimon +package org.apache.spark.sql.paimon -import org.apache.spark.sql.SparkSession +import org.apache.spark.sql.{DataFrame, Dataset, SparkSession} +import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan import org.apache.spark.util.{Utils => SparkUtils} import java.io.File @@ -28,9 +29,14 @@ import java.io.File */ object Utils { - def createTempDir: File = SparkUtils.createTempDir() + def createTempDir: File = SparkUtils.createTempDir(System.getProperty("java.io.tmpdir"), "spark") def waitUntilEventEmpty(spark: SparkSession): Unit = { spark.sparkContext.listenerBus.waitUntilEmpty() } + + def createDataFrame(sparkSession: SparkSession, plan: LogicalPlan): DataFrame = { + Dataset.ofRows(sparkSession, plan) + } + } diff --git a/paimon-spark/paimon-spark3-common/pom.xml b/paimon-spark/paimon-spark3-common/pom.xml index 03d29ea05b3ad..5fd869f1b3938 100644 --- a/paimon-spark/paimon-spark3-common/pom.xml +++ b/paimon-spark/paimon-spark3-common/pom.xml @@ -39,9 +39,35 @@ under the License. - org.apache.spark - spark-sql_${scala.binary.version} - ${spark.version} + org.apache.paimon + paimon-spark-common_${scala.binary.version} + ${project.version} + + + + + org.apache.maven.plugins + maven-shade-plugin + + + shade-paimon + package + + shade + + + + + org.apache.paimon:paimon-bundle + org.apache.paimon:paimon-spark-common_${scala.binary.version} + + + + + + + + \ No newline at end of file diff --git a/paimon-spark/paimon-spark3-common/src/main/resources/META-INF/services/org.apache.spark.sql.paimon.shims.SparkShim b/paimon-spark/paimon-spark3-common/src/main/resources/META-INF/services/org.apache.spark.sql.paimon.shims.SparkShim new file mode 100644 index 0000000000000..b79ef54f6e309 --- /dev/null +++ b/paimon-spark/paimon-spark3-common/src/main/resources/META-INF/services/org.apache.spark.sql.paimon.shims.SparkShim @@ -0,0 +1,16 @@ +# Licensed to the Apache Software Foundation (ASF) under one or more +# contributor license agreements. See the NOTICE file distributed with +# this work for additional information regarding copyright ownership. +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +org.apache.spark.sql.paimon.shims.Spark3Shim \ No newline at end of file diff --git a/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/catalyst/parser/extensions/PaimonSpark3SqlExtensionsParser.scala b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/catalyst/parser/extensions/PaimonSpark3SqlExtensionsParser.scala new file mode 100644 index 0000000000000..07481b6f639f8 --- /dev/null +++ b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/catalyst/parser/extensions/PaimonSpark3SqlExtensionsParser.scala @@ -0,0 +1,25 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. 
The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.catalyst.parser.extensions + +import org.apache.spark.sql.catalyst.parser.ParserInterface +import org.apache.spark.sql.catalyst.parser.extensions.AbstractPaimonSparkSqlExtensionsParser + +class PaimonSpark3SqlExtensionsParser(override val delegate: ParserInterface) + extends AbstractPaimonSparkSqlExtensionsParser(delegate) {} diff --git a/paimon-spark/paimon-spark-3.2/src/test/scala/org/apache/spark/paimon/Utils.scala b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/data/Spark3ArrayData.scala similarity index 73% rename from paimon-spark/paimon-spark-3.2/src/test/scala/org/apache/spark/paimon/Utils.scala rename to paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/data/Spark3ArrayData.scala index 1a899f5001536..cb393d928dcbc 100644 --- a/paimon-spark/paimon-spark-3.2/src/test/scala/org/apache/spark/paimon/Utils.scala +++ b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/data/Spark3ArrayData.scala @@ -16,17 +16,8 @@ * limitations under the License. */ -package org.apache.spark.paimon +package org.apache.paimon.spark.data -import org.apache.spark.util.{Utils => SparkUtils} +import org.apache.paimon.types.DataType -import java.io.File - -/** - * A wrapper that some Objects or Classes is limited to access beyond [[org.apache.spark]] package. - */ -object Utils { - - def createTempDir: File = SparkUtils.createTempDir() - -} +class Spark3ArrayData(override val elementType: DataType) extends AbstractSparkArrayData {} diff --git a/paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/spark/paimon/Utils.scala b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/data/Spark3InternalRow.scala similarity index 73% rename from paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/spark/paimon/Utils.scala rename to paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/data/Spark3InternalRow.scala index 1a899f5001536..9c9a1c6bac959 100644 --- a/paimon-spark/paimon-spark-3.3/src/test/scala/org/apache/spark/paimon/Utils.scala +++ b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/data/Spark3InternalRow.scala @@ -16,17 +16,9 @@ * limitations under the License. */ -package org.apache.spark.paimon +package org.apache.paimon.spark.data -import org.apache.spark.util.{Utils => SparkUtils} +import org.apache.paimon.spark.AbstractSparkInternalRow +import org.apache.paimon.types.RowType -import java.io.File - -/** - * A wrapper that some Objects or Classes is limited to access beyond [[org.apache.spark]] package. 
- */ -object Utils { - - def createTempDir: File = SparkUtils.createTempDir() - -} +class Spark3InternalRow(rowType: RowType) extends AbstractSparkInternalRow(rowType) {} diff --git a/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/shims.scala b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark3Shim.scala similarity index 51% rename from paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/shims.scala rename to paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark3Shim.scala index 13ade3f3c5ac6..57d79d6474e9a 100644 --- a/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/shims.scala +++ b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark3Shim.scala @@ -16,45 +16,44 @@ * limitations under the License. */ -package org.apache.spark.sql.paimon +package org.apache.spark.sql.paimon.shims + +import org.apache.paimon.spark.catalyst.parser.extensions.PaimonSpark3SqlExtensionsParser +import org.apache.paimon.spark.data.{Spark3ArrayData, Spark3InternalRow, SparkArrayData, SparkInternalRow} +import org.apache.paimon.types.{DataType, RowType} import org.apache.spark.sql.{Column, SparkSession} -import org.apache.spark.sql.catalyst.{InternalRow => SparkInternalRow} import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression} -import org.apache.spark.sql.catalyst.parser.{ParserInterface => SparkParserInterface} -import org.apache.spark.sql.catalyst.plans.logical.{Aggregate => SparkAggregate} -import org.apache.spark.sql.catalyst.util.{ArrayData => SparkArrayData} -import org.apache.spark.sql.connector.catalog.{Identifier, Table, TableCatalog => SparkTableCatalog} +import org.apache.spark.sql.catalyst.parser.ParserInterface +import org.apache.spark.sql.catalyst.plans.logical.Aggregate +import org.apache.spark.sql.connector.catalog.{Identifier, Table, TableCatalog} import org.apache.spark.sql.connector.expressions.Transform import org.apache.spark.sql.types.StructType import java.util.{Map => JMap} -/** Shims for Spark 3.x in [[org.apache.spark.sql]]. */ -object shims { - - /** In [[org.apache.spark.sql.catalyst]]. */ +class Spark3Shim extends SparkShim { - abstract class ParserInterface extends SparkParserInterface { - val delegate: SparkParserInterface + override def createSparkParser(delegate: ParserInterface): ParserInterface = { + new PaimonSpark3SqlExtensionsParser(delegate) } - abstract class ArrayData extends SparkArrayData {} - - abstract class InternalRow extends SparkInternalRow {} + override def createSparkInternalRow(rowType: RowType): SparkInternalRow = { + new Spark3InternalRow(rowType) + } - object Aggregate { - def supportsHashAggregate( - aggregateBufferAttributes: Seq[Attribute], - groupingExpression: Seq[Expression]): Boolean = { - SparkAggregate.supportsHashAggregate(aggregateBufferAttributes) - } + override def createSparkArrayData(elementType: DataType): SparkArrayData = { + new Spark3ArrayData(elementType) } - /** In [[org.apache.spark.sql.connector]]. 
*/ + override def supportsHashAggregate( + aggregateBufferAttributes: Seq[Attribute], + groupingExpression: Seq[Expression]): Boolean = { + Aggregate.supportsHashAggregate(aggregateBufferAttributes) + } - def createTable( - tableCatalog: SparkTableCatalog, + override def createTable( + tableCatalog: TableCatalog, ident: Identifier, schema: StructType, partitions: Array[Transform], @@ -62,11 +61,8 @@ object shims { tableCatalog.createTable(ident, schema, partitions, properties) } - /** In [[org.apache.spark.sql.internal]]. */ + override def column(expr: Expression): Column = new Column(expr) - object ExpressionUtils { - def column(expr: Expression): Column = new Column(expr) + override def convertToExpression(spark: SparkSession, column: Column): Expression = column.expr - def convertToExpression(spark: SparkSession, column: Column): Expression = column.expr - } } diff --git a/paimon-spark/paimon-spark4-common/pom.xml b/paimon-spark/paimon-spark4-common/pom.xml index dcc5b370d59aa..d160b984fa056 100644 --- a/paimon-spark/paimon-spark4-common/pom.xml +++ b/paimon-spark/paimon-spark4-common/pom.xml @@ -38,10 +38,57 @@ under the License. + + org.apache.paimon + paimon-spark-common_${scala.binary.version} + ${project.version} + + org.apache.spark - spark-sql_${scala.binary.version} + spark-sql-api_2.13 ${spark.version} + + + log4j + log4j + + + org.slf4j + slf4j-log4j12 + + + org.apache.logging.log4j + log4j-slf4j2-impl + + + - \ No newline at end of file + + + + + org.apache.maven.plugins + maven-shade-plugin + + + shade-paimon + package + + shade + + + + + org.apache.paimon:paimon-bundle + org.apache.paimon:paimon-spark-common_${scala.binary.version} + + + + + + + + + diff --git a/paimon-spark/paimon-spark4-common/src/main/resources/META-INF/services/org.apache.spark.sql.paimon.shims.SparkShim b/paimon-spark/paimon-spark4-common/src/main/resources/META-INF/services/org.apache.spark.sql.paimon.shims.SparkShim new file mode 100644 index 0000000000000..b0df8c67cf9a4 --- /dev/null +++ b/paimon-spark/paimon-spark4-common/src/main/resources/META-INF/services/org.apache.spark.sql.paimon.shims.SparkShim @@ -0,0 +1,16 @@ +# Licensed to the Apache Software Foundation (ASF) under one or more +# contributor license agreements. See the NOTICE file distributed with +# this work for additional information regarding copyright ownership. +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ +org.apache.spark.sql.paimon.shims.Spark4Shim \ No newline at end of file diff --git a/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/catalyst/parser/extensions/PaimonSpark4SqlExtensionsParser.scala b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/catalyst/parser/extensions/PaimonSpark4SqlExtensionsParser.scala new file mode 100644 index 0000000000000..ef1f5763d27b1 --- /dev/null +++ b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/catalyst/parser/extensions/PaimonSpark4SqlExtensionsParser.scala @@ -0,0 +1,28 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.catalyst.parser.extensions + +import org.apache.spark.sql.catalyst.parser.{CompoundBody, ParserInterface} +import org.apache.spark.sql.catalyst.parser.extensions.AbstractPaimonSparkSqlExtensionsParser + +class PaimonSpark4SqlExtensionsParser(override val delegate: ParserInterface) + extends AbstractPaimonSparkSqlExtensionsParser(delegate) { + + def parseScript(sqlScriptText: String): CompoundBody = delegate.parseScript(sqlScriptText) +} diff --git a/paimon-spark/paimon-spark-3.4/src/test/scala/org/apache/spark/paimon/Utils.scala b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/data/Spark4ArrayData.scala similarity index 72% rename from paimon-spark/paimon-spark-3.4/src/test/scala/org/apache/spark/paimon/Utils.scala rename to paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/data/Spark4ArrayData.scala index 1a899f5001536..be319c0a9c232 100644 --- a/paimon-spark/paimon-spark-3.4/src/test/scala/org/apache/spark/paimon/Utils.scala +++ b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/data/Spark4ArrayData.scala @@ -16,17 +16,14 @@ * limitations under the License. */ -package org.apache.spark.paimon +package org.apache.paimon.spark.data -import org.apache.spark.util.{Utils => SparkUtils} +import org.apache.paimon.types.DataType -import java.io.File +import org.apache.spark.unsafe.types.VariantVal -/** - * A wrapper that some Objects or Classes is limited to access beyond [[org.apache.spark]] package. 
- */ -object Utils { +class Spark4ArrayData(override val elementType: DataType) extends AbstractSparkArrayData { - def createTempDir: File = SparkUtils.createTempDir() + override def getVariant(ordinal: Int): VariantVal = throw new UnsupportedOperationException } diff --git a/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/data/Spark4InternalRow.scala b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/data/Spark4InternalRow.scala new file mode 100644 index 0000000000000..54b0f420ea931 --- /dev/null +++ b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/data/Spark4InternalRow.scala @@ -0,0 +1,28 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.spark.data + +import org.apache.paimon.spark.AbstractSparkInternalRow +import org.apache.paimon.types.RowType + +import org.apache.spark.unsafe.types.VariantVal + +class Spark4InternalRow(rowType: RowType) extends AbstractSparkInternalRow(rowType) { + override def getVariant(i: Int): VariantVal = throw new UnsupportedOperationException +} diff --git a/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims.scala b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims.scala deleted file mode 100644 index ee6c9ad35857f..0000000000000 --- a/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims.scala +++ /dev/null @@ -1,86 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. 
- */ - -package org.apache.spark.sql.paimon - -import org.apache.spark.sql.{Column, SparkSession} -import org.apache.spark.sql.catalyst.{InternalRow => SparkInternalRow} -import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression} -import org.apache.spark.sql.catalyst.parser.{CompoundBody, ParserInterface => SparkParserInterface} -import org.apache.spark.sql.catalyst.plans.logical.{Aggregate => SparkAggregate} -import org.apache.spark.sql.catalyst.util.{ArrayData => SparkArrayData} -import org.apache.spark.sql.connector.catalog.{CatalogV2Util, Identifier, Table, TableCatalog => SparkTableCatalog} -import org.apache.spark.sql.connector.expressions.Transform -import org.apache.spark.sql.internal.{ExpressionUtils => SparkExpressionUtils} -import org.apache.spark.sql.types.StructType -import org.apache.spark.unsafe.types.VariantVal - -import java.util.{Map => JMap} - -/** Shims for Spark 4.x in [[org.apache.spark.sql]]. */ -object shims { - - /** In [[org.apache.spark.sql.catalyst]]. */ - - abstract class ParserInterface extends SparkParserInterface { - val delegate: SparkParserInterface - - def parseScript(sqlScriptText: String): CompoundBody = delegate.parseScript(sqlScriptText) - } - - abstract class ArrayData extends SparkArrayData { - def getVariant(ordinal: Int): VariantVal = throw new UnsupportedOperationException - } - - abstract class InternalRow extends SparkInternalRow { - override def getVariant(i: Int): VariantVal = throw new UnsupportedOperationException - } - - object Aggregate { - def supportsHashAggregate( - aggregateBufferAttributes: Seq[Attribute], - groupingExpression: Seq[Expression]): Boolean = { - SparkAggregate.supportsHashAggregate(aggregateBufferAttributes, groupingExpression) - } - } - - /** In [[org.apache.spark.sql.connector]]. */ - - def createTable( - tableCatalog: SparkTableCatalog, - ident: Identifier, - schema: StructType, - partitions: Array[Transform], - properties: JMap[String, String]): Table = { - tableCatalog.createTable( - ident, - CatalogV2Util.structTypeToV2Columns(schema), - partitions, - properties) - } - - /** In [[org.apache.spark.sql.internal]]. */ - - object ExpressionUtils { - def column(expr: Expression): Column = SparkExpressionUtils.column(expr) - - def convertToExpression(spark: SparkSession, column: Column): Expression = { - spark.expression(column) - } - } -} diff --git a/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark4Shim.scala b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark4Shim.scala new file mode 100644 index 0000000000000..dfec4eb71f4f1 --- /dev/null +++ b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark4Shim.scala @@ -0,0 +1,69 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+ * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.spark.sql.paimon.shims + +import org.apache.paimon.spark.catalyst.parser.extensions.PaimonSpark4SqlExtensionsParser +import org.apache.paimon.spark.data.{Spark4ArrayData, Spark4InternalRow, SparkArrayData, SparkInternalRow} +import org.apache.paimon.types.{DataType, RowType} + +import org.apache.spark.sql.{Column, SparkSession} +import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression} +import org.apache.spark.sql.catalyst.parser.ParserInterface +import org.apache.spark.sql.catalyst.plans.logical.Aggregate +import org.apache.spark.sql.connector.catalog.{CatalogV2Util, Identifier, Table, TableCatalog} +import org.apache.spark.sql.connector.expressions.Transform +import org.apache.spark.sql.internal.ExpressionUtils +import org.apache.spark.sql.types.StructType + +import java.util.{Map => JMap} + +class Spark4Shim extends SparkShim { + + override def createSparkParser(delegate: ParserInterface): ParserInterface = { + new PaimonSpark4SqlExtensionsParser(delegate) + } + override def createSparkInternalRow(rowType: RowType): SparkInternalRow = { + new Spark4InternalRow(rowType) + } + + override def createSparkArrayData(elementType: DataType): SparkArrayData = { + new Spark4ArrayData(elementType) + } + + def supportsHashAggregate( + aggregateBufferAttributes: Seq[Attribute], + groupingExpression: Seq[Expression]): Boolean = { + Aggregate.supportsHashAggregate(aggregateBufferAttributes, groupingExpression) + } + + def createTable( + tableCatalog: TableCatalog, + ident: Identifier, + schema: StructType, + partitions: Array[Transform], + properties: JMap[String, String]): Table = { + val columns = CatalogV2Util.structTypeToV2Columns(schema) + tableCatalog.createTable(ident, columns, partitions, properties) + } + + def column(expr: Expression): Column = ExpressionUtils.column(expr) + + def convertToExpression(spark: SparkSession, column: Column): Expression = + spark.expression(column) +} diff --git a/paimon-spark/pom.xml b/paimon-spark/pom.xml index aac73baa5fec4..61ecd20a0500a 100644 --- a/paimon-spark/pom.xml +++ b/paimon-spark/pom.xml @@ -39,6 +39,7 @@ under the License. paimon-spark-common + paimon-spark-ut @@ -114,6 +115,21 @@ under the License. + + org.apache.spark + spark-hive_${scala.binary.version} + + + log4j + log4j + + + org.slf4j + slf4j-log4j12 + + + + org.apache.paimon paimon-bundle @@ -180,22 +196,6 @@ under the License. - - - org.apache.spark - spark-hive_${scala.binary.version} - test - - - log4j - log4j - - - org.slf4j - slf4j-log4j12 - - - @@ -278,6 +278,12 @@ under the License. 
aws-java-sdk-core ${aws.version} test + + + com.fasterxml.jackson.core + * + + From 139b5a75a5f0b89bc9d9c91f8c06dfb68691c9e0 Mon Sep 17 00:00:00 2001 From: xleoken Date: Tue, 26 Nov 2024 17:00:45 +0800 Subject: [PATCH 066/157] [core] Improve the performance of show tables (#4592) --- .../org/apache/paimon/catalog/AbstractCatalog.java | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java b/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java index d3a8d628a2bc6..16b76513d7efd 100644 --- a/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java +++ b/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java @@ -653,7 +653,16 @@ protected List listTablesInFileSystem(Path databasePath) throws IOExcept } protected boolean tableExistsInFileSystem(Path tablePath, String branchName) { - return !new SchemaManager(fileIO, tablePath, branchName).listAllIds().isEmpty(); + SchemaManager schemaManager = new SchemaManager(fileIO, tablePath, branchName); + + // in order to improve the performance, check the schema-0 firstly. + boolean schemaZeroExists = schemaManager.schemaExists(0); + if (schemaZeroExists) { + return true; + } else { + // if schema-0 not exists, fallback to check other schemas + return !schemaManager.listAllIds().isEmpty(); + } } public Optional tableSchemaInFileSystem(Path tablePath, String branchName) { From 01d2bb21b22c8380acc94e30e2f2267809d575e1 Mon Sep 17 00:00:00 2001 From: Yann Byron Date: Tue, 26 Nov 2024 17:07:58 +0800 Subject: [PATCH 067/157] [spark] define spark properties globally (#4593) --- pom.xml | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/pom.xml b/pom.xml index 24f2923319508..85a880f35158e 100644 --- a/pom.xml +++ b/pom.xml @@ -115,6 +115,12 @@ under the License. 3.0.1-1.18 8.0.27 + + paimon-spark3-common + 3.5.3 + 3.3 + 3.3.0 + 1.5.5-11 3.0.11 3.4.6 From a67bab179214be54b90b39119c2045cb075fe55e Mon Sep 17 00:00:00 2001 From: Zouxxyy Date: Tue, 26 Nov 2024 20:15:18 +0800 Subject: [PATCH 068/157] [spark] Explicitly set spark3 profile in publish snapshot (#4595) --- .github/workflows/publish_snapshot.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/publish_snapshot.yml b/.github/workflows/publish_snapshot.yml index 7d370814da947..c7f97cab991f9 100644 --- a/.github/workflows/publish_snapshot.yml +++ b/.github/workflows/publish_snapshot.yml @@ -64,6 +64,6 @@ jobs: echo "$ASF_PASSWORD" >> $tmp_settings echo "" >> $tmp_settings - mvn --settings $tmp_settings clean deploy -Dgpg.skip -Drat.skip -DskipTests -Papache-release + mvn --settings $tmp_settings clean deploy -Dgpg.skip -Drat.skip -DskipTests -Papache-release,spark3 rm $tmp_settings From 7a390135617a86906f172a391a182a9b3b3dae04 Mon Sep 17 00:00:00 2001 From: Jingsong Date: Wed, 27 Nov 2024 10:24:40 +0800 Subject: [PATCH 069/157] [doc] Add changelog merging into changelog-producer --- docs/content/maintenance/write-performance.md | 9 --------- docs/content/primary-key-table/changelog-producer.md | 11 +++++++++++ 2 files changed, 11 insertions(+), 9 deletions(-) diff --git a/docs/content/maintenance/write-performance.md b/docs/content/maintenance/write-performance.md index 02362b9096e7e..ade2c3353e3cc 100644 --- a/docs/content/maintenance/write-performance.md +++ b/docs/content/maintenance/write-performance.md @@ -160,12 +160,3 @@ You can use fine-grained-resource-management of Flink to increase committer heap 1. 
Configure Flink Configuration `cluster.fine-grained-resource-management.enabled: true`. (This is default after Flink 1.18) 2. Configure Paimon Table Options: `sink.committer-memory`, for example 300 MB, depends on your `TaskManager`. (`sink.committer-cpu` is also supported) - -## Changelog Compaction - -If Flink's checkpoint interval is short (for example, 30 seconds) and the number of buckets is large, -each snapshot may produce lots of small changelog files. -Too many files may put a burden on the distributed storage cluster. - -In order to compact small changelog files into large ones, you can set the table option `changelog.precommit-compact = true`. -Default value of this option is false, if true, it will add a compact coordinator and worker operator after the writer operator, which copies changelog files into large ones. diff --git a/docs/content/primary-key-table/changelog-producer.md b/docs/content/primary-key-table/changelog-producer.md index 011f7b6f27a7f..a9364ee9f07c5 100644 --- a/docs/content/primary-key-table/changelog-producer.md +++ b/docs/content/primary-key-table/changelog-producer.md @@ -130,3 +130,14 @@ efficient as the input changelog producer and the latency to produce changelog m Full-compaction changelog-producer supports `changelog-producer.row-deduplicate` to avoid generating -U, +U changelog for the same record. + +## Changelog Merging + +This applies to the `input`, `lookup` and `full-compaction` values of `changelog-producer`. + +If Flink's checkpoint interval is short (for example, 30 seconds) and the number of buckets is large, each snapshot may +produce lots of small changelog files. Too many files may put a burden on the distributed storage cluster. + +In order to compact small changelog files into large ones, you can set the table option `changelog.precommit-compact = true`. +The default value of this option is false. If true, it will add a compact coordinator and worker operator after the writer +operator, which copies changelog files into large ones.
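The "Changelog Merging" doc text above describes the `changelog.precommit-compact` table option. The following is a minimal sketch (not part of the patch) of how such a table could be declared from a Flink job; the catalog name, warehouse path, table schema and the choice of the `lookup` changelog producer are illustrative assumptions.

```java
import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment;
import org.apache.flink.table.api.bridge.java.StreamTableEnvironment;

public class ChangelogPrecommitCompactExample {
    public static void main(String[] args) {
        StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();
        // A short checkpoint interval (30 seconds) is the scenario that tends to
        // produce many small changelog files per snapshot.
        env.enableCheckpointing(30_000);
        StreamTableEnvironment tEnv = StreamTableEnvironment.create(env);

        // Hypothetical catalog name and warehouse path, for illustration only.
        tEnv.executeSql(
                "CREATE CATALOG paimon_catalog WITH ("
                        + " 'type' = 'paimon',"
                        + " 'warehouse' = 'file:///tmp/paimon-warehouse')");
        tEnv.executeSql("USE CATALOG paimon_catalog");

        // Enable pre-commit compaction of small changelog files for a
        // changelog-producing primary key table.
        tEnv.executeSql(
                "CREATE TABLE orders ("
                        + " order_id BIGINT,"
                        + " amount INT,"
                        + " PRIMARY KEY (order_id) NOT ENFORCED"
                        + ") WITH ("
                        + " 'changelog-producer' = 'lookup',"
                        + " 'changelog.precommit-compact' = 'true')");
    }
}
```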
From 0185f7c19bd798e2f1e03934d48e82f09893576b Mon Sep 17 00:00:00 2001 From: Jingsong Lee Date: Wed, 27 Nov 2024 14:25:18 +0800 Subject: [PATCH 070/157] [core] Drop stats for overwrite commit (#4598) --- .../java/org/apache/paimon/operation/FileStoreCommitImpl.java | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/FileStoreCommitImpl.java b/paimon-core/src/main/java/org/apache/paimon/operation/FileStoreCommitImpl.java index 69efce9189514..bbd9b27ee6572 100644 --- a/paimon-core/src/main/java/org/apache/paimon/operation/FileStoreCommitImpl.java +++ b/paimon-core/src/main/java/org/apache/paimon/operation/FileStoreCommitImpl.java @@ -176,7 +176,8 @@ public FileStoreCommitImpl( this.manifestFile = manifestFileFactory.create(); this.manifestList = manifestListFactory.create(); this.indexManifestFile = indexManifestFileFactory.create(); - this.scan = scan; + // Stats in DELETE Manifest Entries is useless + this.scan = scan.dropStats(); this.numBucket = numBucket; this.manifestTargetSize = manifestTargetSize; this.manifestFullCompactionSize = manifestFullCompactionSize; From a79b08bc668c16e143e3f0126d59dea2a7253b11 Mon Sep 17 00:00:00 2001 From: LsomeYeah <94825748+LsomeYeah@users.noreply.github.com> Date: Wed, 27 Nov 2024 15:09:19 +0800 Subject: [PATCH 071/157] [core] Add tests for drop stats for overwrite commit (#4600) --- .../paimon/operation/FileStoreCommitTest.java | 29 +++++++++++++++++++ 1 file changed, 29 insertions(+) diff --git a/paimon-core/src/test/java/org/apache/paimon/operation/FileStoreCommitTest.java b/paimon-core/src/test/java/org/apache/paimon/operation/FileStoreCommitTest.java index 67945df60ce83..de4ee684b830f 100644 --- a/paimon-core/src/test/java/org/apache/paimon/operation/FileStoreCommitTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/operation/FileStoreCommitTest.java @@ -31,8 +31,11 @@ import org.apache.paimon.fs.local.LocalFileIO; import org.apache.paimon.index.IndexFileHandler; import org.apache.paimon.index.IndexFileMeta; +import org.apache.paimon.manifest.FileKind; import org.apache.paimon.manifest.IndexManifestEntry; import org.apache.paimon.manifest.ManifestCommittable; +import org.apache.paimon.manifest.ManifestEntry; +import org.apache.paimon.manifest.ManifestFile; import org.apache.paimon.manifest.ManifestFileMeta; import org.apache.paimon.mergetree.compact.DeduplicateMergeFunction; import org.apache.paimon.predicate.PredicateBuilder; @@ -80,6 +83,7 @@ import static org.apache.paimon.index.HashIndexFile.HASH_INDEX; import static org.apache.paimon.partition.PartitionPredicate.createPartitionPredicate; +import static org.apache.paimon.stats.SimpleStats.EMPTY_STATS; import static org.apache.paimon.testutils.assertj.PaimonAssertions.anyCauseMatches; import static org.assertj.core.api.Assertions.assertThat; import static org.assertj.core.api.Assertions.assertThatThrownBy; @@ -943,6 +947,31 @@ public void testManifestCompact() throws Exception { .isEqualTo(0); } + @Test + public void testDropStatsForOverwrite() throws Exception { + TestFileStore store = createStore(false); + + List keyValues = generateDataList(1); + BinaryRow partition = gen.getPartition(keyValues.get(0)); + // commit 1 + Snapshot snapshot1 = + store.commitData(keyValues, s -> partition, kv -> 0, Collections.emptyMap()).get(0); + // overwrite commit 2 + Snapshot snapshot2 = + store.overwriteData(keyValues, s -> partition, kv -> 0, Collections.emptyMap()) + .get(0); + ManifestFile manifestFile = 
store.manifestFileFactory().create(); + List entries = + store.manifestListFactory().create().readDataManifests(snapshot2).stream() + .flatMap(meta -> manifestFile.read(meta.fileName()).stream()) + .collect(Collectors.toList()); + for (ManifestEntry manifestEntry : entries) { + if (manifestEntry.kind() == FileKind.DELETE) { + assertThat(manifestEntry.file().valueStats()).isEqualTo(EMPTY_STATS); + } + } + } + @Test public void testManifestCompactFull() throws Exception { // Disable full compaction by options. From 530efddbe2f201cbfbe9a5e40211464f3df4895a Mon Sep 17 00:00:00 2001 From: Zouxxyy Date: Wed, 27 Nov 2024 16:58:07 +0800 Subject: [PATCH 072/157] [test] Fix build Spark utit workflow on jdk11 (#4596) --- .github/workflows/utitcase-jdk11.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/utitcase-jdk11.yml b/.github/workflows/utitcase-jdk11.yml index f1d7c25cbe44a..878ce5f968981 100644 --- a/.github/workflows/utitcase-jdk11.yml +++ b/.github/workflows/utitcase-jdk11.yml @@ -53,7 +53,7 @@ jobs: jvm_timezone=$(random_timezone) echo "JVM timezone is set to $jvm_timezone" test_modules="!paimon-e2e-tests,!org.apache.paimon:paimon-hive-connector-3.1," - for suffix in 3.5 3.4 3.3 3.2 common; do + for suffix in 3.5 3.4 3.3 3.2 ut; do test_modules+="!org.apache.paimon:paimon-spark-${suffix}," done test_modules="${test_modules%,}" From 7e4148ab890f1e62b448447216a9b9558bd025bc Mon Sep 17 00:00:00 2001 From: yunfengzhou-hub Date: Wed, 27 Nov 2024 17:46:13 +0800 Subject: [PATCH 073/157] [flink] Avoids miscellaneous deprecated APIs for 2.0 Preview (#4590) --- .../org/apache/paimon/flink/FlinkFileIO.java | 24 ++++++++++++++++-- .../flink/source/FileStoreSourceReader.java | 23 ----------------- .../source/align/AlignedSourceReader.java | 2 +- .../paimon/flink/CatalogTableITCase.java | 25 +++++++++++-------- .../flink/source/IteratorSourcesITCase.java | 4 +-- .../util/MiniClusterWithClientExtension.java | 6 ----- .../flink/util/ReadWriteTableTestUtil.java | 6 ++--- 7 files changed, 42 insertions(+), 48 deletions(-) diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkFileIO.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkFileIO.java index 74512409bfc80..617d25125f371 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkFileIO.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkFileIO.java @@ -29,10 +29,10 @@ import org.apache.flink.core.fs.FSDataOutputStream; import org.apache.flink.core.fs.FileSystem; import org.apache.flink.core.fs.FileSystem.WriteMode; -import org.apache.flink.core.fs.FileSystemKind; import java.io.IOException; import java.io.UncheckedIOException; +import java.util.Locale; /** Flink {@link FileIO} to use {@link FileSystem}. 
*/ public class FlinkFileIO implements FileIO { @@ -48,7 +48,27 @@ public FlinkFileIO(Path path) { @Override public boolean isObjectStore() { try { - return path.getFileSystem().getKind() != FileSystemKind.FILE_SYSTEM; + FileSystem fs = path.getFileSystem(); + String scheme = fs.getUri().getScheme().toLowerCase(Locale.US); + + if (scheme.startsWith("s3") + || scheme.startsWith("emr") + || scheme.startsWith("oss") + || scheme.startsWith("wasb") + || scheme.startsWith("gs")) { + // the Amazon S3 storage or Aliyun OSS storage or Azure Blob Storage + // or Google Cloud Storage + return true; + } else if (scheme.startsWith("http") || scheme.startsWith("ftp")) { + // file servers instead of file systems + // they might actually be consistent, but we have no hard guarantees + // currently to rely on that + return true; + } else { + // the remainder should include hdfs, kosmos, ceph, ... + // this also includes federated HDFS (viewfs). + return false; + } } catch (IOException e) { throw new UncheckedIOException(e); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FileStoreSourceReader.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FileStoreSourceReader.java index 92adf5e04998e..8fc78c868ba57 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FileStoreSourceReader.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/FileStoreSourceReader.java @@ -25,9 +25,7 @@ import org.apache.flink.api.connector.source.SourceReader; import org.apache.flink.api.connector.source.SourceReaderContext; -import org.apache.flink.connector.base.source.reader.RecordsWithSplitIds; import org.apache.flink.connector.base.source.reader.SingleThreadMultiplexSourceReaderBase; -import org.apache.flink.connector.base.source.reader.synchronization.FutureCompletingBlockingQueue; import org.apache.flink.connector.file.src.reader.BulkFormat.RecordIterator; import org.apache.flink.table.data.RowData; @@ -64,27 +62,6 @@ public FileStoreSourceReader( this.ioManager = ioManager; } - public FileStoreSourceReader( - SourceReaderContext readerContext, - TableRead tableRead, - FileStoreSourceReaderMetrics metrics, - IOManager ioManager, - @Nullable Long limit, - FutureCompletingBlockingQueue>> - elementsQueue) { - super( - elementsQueue, - () -> - new FileStoreSourceSplitReader( - tableRead, RecordLimiter.create(limit), metrics), - (element, output, state) -> - FlinkRecordsWithSplitIds.emitRecord( - readerContext, element, output, state, metrics), - readerContext.getConfiguration(), - readerContext); - this.ioManager = ioManager; - } - @Override public void start() { // we request a split only if we did not get splits during the checkpoint restore diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/align/AlignedSourceReader.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/align/AlignedSourceReader.java index 1f0bbca314b63..a8ffe3de561f9 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/align/AlignedSourceReader.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/align/AlignedSourceReader.java @@ -58,7 +58,7 @@ public AlignedSourceReader( @Nullable Long limit, FutureCompletingBlockingQueue>> elementsQueue) { - super(readerContext, tableRead, metrics, ioManager, limit, elementsQueue); + super(readerContext, tableRead, metrics, ioManager, 
limit); this.elementsQueue = elementsQueue; this.nextCheckpointId = null; } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java index 2a855796d8d45..96334de3f87b5 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java @@ -251,17 +251,20 @@ public void testSchemasTable() { sql("ALTER TABLE T SET ('snapshot.num-retained.min' = '18')"); sql("ALTER TABLE T SET ('manifest.format' = 'avro')"); - assertThat(sql("SHOW CREATE TABLE T$schemas").toString()) - .isEqualTo( - "[+I[CREATE TABLE `PAIMON`.`default`.`T$schemas` (\n" - + " `schema_id` BIGINT NOT NULL,\n" - + " `fields` VARCHAR(2147483647) NOT NULL,\n" - + " `partition_keys` VARCHAR(2147483647) NOT NULL,\n" - + " `primary_keys` VARCHAR(2147483647) NOT NULL,\n" - + " `options` VARCHAR(2147483647) NOT NULL,\n" - + " `comment` VARCHAR(2147483647),\n" - + " `update_time` TIMESTAMP(3) NOT NULL\n" - + ") ]]"); + String actualResult = sql("SHOW CREATE TABLE T$schemas").toString(); + String expectedResult = + "[+I[CREATE TABLE `PAIMON`.`default`.`T$schemas` (\n" + + " `schema_id` BIGINT NOT NULL,\n" + + " `fields` VARCHAR(2147483647) NOT NULL,\n" + + " `partition_keys` VARCHAR(2147483647) NOT NULL,\n" + + " `primary_keys` VARCHAR(2147483647) NOT NULL,\n" + + " `options` VARCHAR(2147483647) NOT NULL,\n" + + " `comment` VARCHAR(2147483647),\n" + + " `update_time` TIMESTAMP(3) NOT NULL\n" + + ") ]]"; + actualResult = actualResult.replace(" ", "").replace("\n", ""); + expectedResult = expectedResult.replace(" ", "").replace("\n", ""); + assertThat(actualResult).isEqualTo(expectedResult); List result = sql( diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/IteratorSourcesITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/IteratorSourcesITCase.java index 8404d994fa9f2..0c5d485af7bc9 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/IteratorSourcesITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/IteratorSourcesITCase.java @@ -18,10 +18,10 @@ package org.apache.paimon.flink.source; +import org.apache.commons.collections.IteratorUtils; import org.apache.flink.api.common.eventtime.WatermarkStrategy; import org.apache.flink.runtime.testutils.MiniClusterResourceConfiguration; import org.apache.flink.streaming.api.datastream.DataStream; -import org.apache.flink.streaming.api.datastream.DataStreamUtils; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; import org.apache.flink.table.data.RowData; import org.apache.flink.test.util.MiniClusterWithClientResource; @@ -67,7 +67,7 @@ public void testParallelSourceExecution() throws Exception { "iterator source"); final List result = - DataStreamUtils.collectBoundedStream(stream, "Iterator Source Test"); + IteratorUtils.toList(stream.executeAndCollect("Iterator Source Test")); verifySequence(result, 1L, 1_000L); } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/MiniClusterWithClientExtension.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/MiniClusterWithClientExtension.java index cfc23a0a44d8d..39939f78670b9 100644 --- 
a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/MiniClusterWithClientExtension.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/MiniClusterWithClientExtension.java @@ -29,7 +29,6 @@ import org.apache.flink.runtime.testutils.MiniClusterResourceConfiguration; import org.apache.flink.streaming.util.TestStreamEnvironment; import org.apache.flink.test.junit5.InjectClusterClient; -import org.apache.flink.test.util.TestEnvironment; import org.junit.jupiter.api.extension.AfterAllCallback; import org.junit.jupiter.api.extension.AfterEachCallback; import org.junit.jupiter.api.extension.BeforeAllCallback; @@ -167,17 +166,12 @@ private void registerEnv(InternalMiniClusterExtension internalMiniClusterExtensi .getOptional(CoreOptions.DEFAULT_PARALLELISM) .orElse(internalMiniClusterExtension.getNumberSlots()); - TestEnvironment executionEnvironment = - new TestEnvironment( - internalMiniClusterExtension.getMiniCluster(), defaultParallelism, false); - executionEnvironment.setAsContext(); TestStreamEnvironment.setAsContext( internalMiniClusterExtension.getMiniCluster(), defaultParallelism); } private void unregisterEnv(InternalMiniClusterExtension internalMiniClusterExtension) { TestStreamEnvironment.unsetAsContext(); - TestEnvironment.unsetAsContext(); } private MiniClusterClient createMiniClusterClient( diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/ReadWriteTableTestUtil.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/ReadWriteTableTestUtil.java index 9c3170f9a96b1..0eac2ed2936e0 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/ReadWriteTableTestUtil.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/util/ReadWriteTableTestUtil.java @@ -23,7 +23,6 @@ import org.apache.paimon.utils.BlockingIterator; import org.apache.flink.api.common.RuntimeExecutionMode; -import org.apache.flink.api.common.time.Time; import org.apache.flink.configuration.Configuration; import org.apache.flink.configuration.RestartStrategyOptions; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; @@ -37,6 +36,7 @@ import javax.annotation.Nullable; import java.nio.file.Paths; +import java.time.Duration; import java.util.ArrayList; import java.util.Collections; import java.util.HashMap; @@ -53,7 +53,7 @@ /** Test util for {@link ReadWriteTableITCase}. 
*/ public class ReadWriteTableTestUtil { - private static final Time TIME_OUT = Time.seconds(10); + private static final Duration TIME_OUT = Duration.ofSeconds(10); public static final int DEFAULT_PARALLELISM = 2; @@ -278,7 +278,7 @@ public static void testBatchRead(String query, List expected) throws Except try (BlockingIterator iterator = BlockingIterator.of(resultItr)) { if (!expected.isEmpty()) { List result = - iterator.collect(expected.size(), TIME_OUT.getSize(), TIME_OUT.getUnit()); + iterator.collect(expected.size(), TIME_OUT.getSeconds(), TimeUnit.SECONDS); assertThat(toInsertOnlyRows(result)) .containsExactlyInAnyOrderElementsOf(toInsertOnlyRows(expected)); } From fe693135015c535f13cbc97b2b1a94bb17cbd6c0 Mon Sep 17 00:00:00 2001 From: Jingsong Lee Date: Wed, 27 Nov 2024 19:01:52 +0800 Subject: [PATCH 074/157] [core] Cache statistics in AbstractFileStoreTable (#4601) --- .../apache/paimon/catalog/CachingCatalog.java | 7 +++ .../apache/paimon/stats/StatsFileHandler.java | 15 +++--- .../paimon/table/AbstractFileStoreTable.java | 47 +++++++++++++++++-- .../paimon/table/DelegatedFileStoreTable.java | 5 ++ .../apache/paimon/table/FileStoreTable.java | 3 ++ .../paimon/catalog/CachingCatalogTest.java | 7 ++- .../paimon/flink/FlinkAnalyzeTableITCase.java | 15 +++++- 7 files changed, 86 insertions(+), 13 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/catalog/CachingCatalog.java b/paimon-core/src/main/java/org/apache/paimon/catalog/CachingCatalog.java index 1912ad60623cb..f67f19700d6e2 100644 --- a/paimon-core/src/main/java/org/apache/paimon/catalog/CachingCatalog.java +++ b/paimon-core/src/main/java/org/apache/paimon/catalog/CachingCatalog.java @@ -265,6 +265,13 @@ private void putTableCache(Identifier identifier, Table table) { .maximumSize(snapshotMaxNumPerTable) .executor(Runnable::run) .build()); + storeTable.setStatsCache( + Caffeine.newBuilder() + .softValues() + .expireAfterAccess(expirationInterval) + .maximumSize(5) + .executor(Runnable::run) + .build()); if (manifestCache != null) { storeTable.setManifestCache(manifestCache); } diff --git a/paimon-core/src/main/java/org/apache/paimon/stats/StatsFileHandler.java b/paimon-core/src/main/java/org/apache/paimon/stats/StatsFileHandler.java index f9e057c7cbb32..5cb88f7257a7e 100644 --- a/paimon-core/src/main/java/org/apache/paimon/stats/StatsFileHandler.java +++ b/paimon-core/src/main/java/org/apache/paimon/stats/StatsFileHandler.java @@ -71,13 +71,14 @@ public Optional readStats(long snapshotId) { } public Optional readStats(Snapshot snapshot) { - if (snapshot.statistics() == null) { - return Optional.empty(); - } else { - Statistics stats = statsFile.read(snapshot.statistics()); - stats.deserializeFieldsFromString(schemaManager.schema(stats.schemaId())); - return Optional.of(stats); - } + String file = snapshot.statistics(); + return file == null ? Optional.empty() : Optional.of(readStats(file)); + } + + public Statistics readStats(String file) { + Statistics stats = statsFile.read(file); + stats.deserializeFieldsFromString(schemaManager.schema(stats.schemaId())); + return stats; } /** Delete stats of the specified snapshot. 
*/ diff --git a/paimon-core/src/main/java/org/apache/paimon/table/AbstractFileStoreTable.java b/paimon-core/src/main/java/org/apache/paimon/table/AbstractFileStoreTable.java index 4180ff11c1677..57966d24ce474 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/AbstractFileStoreTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/AbstractFileStoreTable.java @@ -92,6 +92,7 @@ abstract class AbstractFileStoreTable implements FileStoreTable { private static final long serialVersionUID = 1L; + private static final String WATERMARK_PREFIX = "watermark-"; protected final FileIO fileIO; @@ -99,6 +100,10 @@ abstract class AbstractFileStoreTable implements FileStoreTable { protected final TableSchema tableSchema; protected final CatalogEnvironment catalogEnvironment; + @Nullable protected transient SegmentsCache manifestCache; + @Nullable protected transient Cache snapshotCache; + @Nullable protected transient Cache statsCache; + protected AbstractFileStoreTable( FileIO fileIO, Path path, @@ -122,14 +127,21 @@ public String currentBranch() { @Override public void setManifestCache(SegmentsCache manifestCache) { + this.manifestCache = manifestCache; store().setManifestCache(manifestCache); } @Override public void setSnapshotCache(Cache cache) { + this.snapshotCache = cache; store().setSnapshotCache(cache); } + @Override + public void setStatsCache(Cache cache) { + this.statsCache = cache; + } + @Override public OptionalLong latestSnapshotId() { Long snapshot = store().snapshotManager().latestSnapshotId(); @@ -187,7 +199,21 @@ public String uuid() { public Optional statistics() { Snapshot snapshot = TimeTravelUtil.resolveSnapshot(this); if (snapshot != null) { - return store().newStatsFileHandler().readStats(snapshot); + String file = snapshot.statistics(); + if (file == null) { + return Optional.empty(); + } + if (statsCache != null) { + Statistics stats = statsCache.getIfPresent(file); + if (stats != null) { + return Optional.of(stats); + } + } + Statistics stats = store().newStatsFileHandler().readStats(file); + if (statsCache != null) { + statsCache.put(file, stats); + } + return Optional.of(stats); } return Optional.empty(); } @@ -342,9 +368,22 @@ public FileStoreTable copyWithLatestSchema() { @Override public FileStoreTable copy(TableSchema newTableSchema) { - return newTableSchema.primaryKeys().isEmpty() - ? new AppendOnlyFileStoreTable(fileIO, path, newTableSchema, catalogEnvironment) - : new PrimaryKeyFileStoreTable(fileIO, path, newTableSchema, catalogEnvironment); + AbstractFileStoreTable copied = + newTableSchema.primaryKeys().isEmpty() + ? 
new AppendOnlyFileStoreTable( + fileIO, path, newTableSchema, catalogEnvironment) + : new PrimaryKeyFileStoreTable( + fileIO, path, newTableSchema, catalogEnvironment); + if (snapshotCache != null) { + copied.setSnapshotCache(snapshotCache); + } + if (manifestCache != null) { + copied.setManifestCache(manifestCache); + } + if (statsCache != null) { + copied.setStatsCache(statsCache); + } + return copied; } @Override diff --git a/paimon-core/src/main/java/org/apache/paimon/table/DelegatedFileStoreTable.java b/paimon-core/src/main/java/org/apache/paimon/table/DelegatedFileStoreTable.java index 624476b5b43e0..0a548941bedcd 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/DelegatedFileStoreTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/DelegatedFileStoreTable.java @@ -130,6 +130,11 @@ public void setSnapshotCache(Cache cache) { wrapped.setSnapshotCache(cache); } + @Override + public void setStatsCache(Cache cache) { + wrapped.setStatsCache(cache); + } + @Override public TableSchema schema() { return wrapped.schema(); diff --git a/paimon-core/src/main/java/org/apache/paimon/table/FileStoreTable.java b/paimon-core/src/main/java/org/apache/paimon/table/FileStoreTable.java index d37e57e4e57ec..61aa77d5f36a5 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/FileStoreTable.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/FileStoreTable.java @@ -24,6 +24,7 @@ import org.apache.paimon.fs.Path; import org.apache.paimon.manifest.ManifestCacheFilter; import org.apache.paimon.schema.TableSchema; +import org.apache.paimon.stats.Statistics; import org.apache.paimon.table.query.LocalTableQuery; import org.apache.paimon.table.sink.RowKeyExtractor; import org.apache.paimon.table.sink.TableCommitImpl; @@ -47,6 +48,8 @@ public interface FileStoreTable extends DataTable { void setSnapshotCache(Cache cache); + void setStatsCache(Cache cache); + @Override default RowType rowType() { return schema().logicalRowType(); diff --git a/paimon-core/src/test/java/org/apache/paimon/catalog/CachingCatalogTest.java b/paimon-core/src/test/java/org/apache/paimon/catalog/CachingCatalogTest.java index e4f0a1510b8de..7567f682ae604 100644 --- a/paimon-core/src/test/java/org/apache/paimon/catalog/CachingCatalogTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/catalog/CachingCatalogTest.java @@ -352,6 +352,10 @@ public void testSnapshotCache() throws Exception { Snapshot snapshot = table.snapshot(1); assertThat(snapshot).isSameAs(table.snapshot(1)); + + // copy + Snapshot copied = table.copy(Collections.singletonMap("a", "b")).snapshot(1); + assertThat(copied).isSameAs(snapshot); } @Test @@ -386,7 +390,8 @@ private void innerTestManifestCache(long manifestCacheThreshold) throws Exceptio // repeat read for (int i = 0; i < 5; i++) { - table = catalog.getTable(tableIdent); + // test copy too + table = catalog.getTable(tableIdent).copy(Collections.singletonMap("a", "b")); ReadBuilder readBuilder = table.newReadBuilder(); TableScan scan = readBuilder.newScan(); TableRead read = readBuilder.newRead(); diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkAnalyzeTableITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkAnalyzeTableITCase.java index ad8a2d45a0368..e186080d9f45d 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkAnalyzeTableITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkAnalyzeTableITCase.java @@ -22,11 
+22,13 @@ import org.apache.paimon.data.Decimal; import org.apache.paimon.stats.ColStats; import org.apache.paimon.stats.Statistics; +import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.utils.DateTimeUtils; import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.Test; +import java.util.Collections; import java.util.Map; import java.util.Optional; @@ -51,7 +53,8 @@ public void testAnalyzeTable() throws Catalog.TableNotExistException { sql("INSERT INTO T VALUES ('2', 'aaa', 1, 2)"); sql("ANALYZE TABLE T COMPUTE STATISTICS"); - Optional statisticsOpt = paimonTable("T").statistics(); + FileStoreTable table = paimonTable("T"); + Optional statisticsOpt = table.statistics(); assertThat(statisticsOpt.isPresent()).isTrue(); Statistics stats = statisticsOpt.get(); @@ -60,6 +63,16 @@ public void testAnalyzeTable() throws Catalog.TableNotExistException { Assertions.assertTrue(stats.mergedRecordSize().isPresent()); Assertions.assertTrue(stats.colStats().isEmpty()); + + // by default, caching catalog should cache it + Optional newStats = table.statistics(); + assertThat(newStats.isPresent()).isTrue(); + assertThat(newStats.get()).isSameAs(stats); + + // copy the table + newStats = table.copy(Collections.singletonMap("a", "b")).statistics(); + assertThat(newStats.isPresent()).isTrue(); + assertThat(newStats.get()).isSameAs(stats); } @Test From 4bcf8576b3a5af66adb47dba7b8427581d080aab Mon Sep 17 00:00:00 2001 From: HunterXHunter <1356469429@qq.com> Date: Wed, 27 Nov 2024 19:11:39 +0800 Subject: [PATCH 075/157] [flink] Support minor compact strategy for dedicated compaction action. (#4589) --- docs/content/flink/procedures.md | 15 +- .../maintenance/dedicated-compaction.md | 8 + docs/content/spark/procedures.md | 4 +- .../procedure/CompactDatabaseProcedure.java | 13 +- .../flink/procedure/CompactProcedure.java | 16 +- .../ProcedurePositionalArgumentsITCase.java | 8 +- .../paimon/flink/action/ActionFactory.java | 4 + .../paimon/flink/action/CompactAction.java | 17 +- .../flink/action/CompactActionFactory.java | 24 +- .../flink/action/CompactDatabaseAction.java | 47 ++-- .../action/CompactDatabaseActionFactory.java | 15 +- .../procedure/CompactDatabaseProcedure.java | 13 +- .../flink/procedure/CompactProcedure.java | 13 +- .../sink/CombinedTableCompactorSink.java | 17 +- .../flink/sink/CompactorSinkBuilder.java | 10 +- .../sink/MultiTablesStoreCompactOperator.java | 6 +- .../flink/action/CompactActionITCase.java | 35 --- .../flink/action/CompactActionITCaseBase.java | 36 +++ .../action/MinorCompactActionITCase.java | 205 ++++++++++++++++++ .../procedure/CompactProcedureITCase.java | 112 ++++++++++ .../flink/sink/CompactorSinkITCase.java | 14 +- .../spark/procedure/CompactProcedure.java | 35 ++- .../procedure/CompactProcedureTestBase.scala | 50 +++++ 23 files changed, 622 insertions(+), 95 deletions(-) create mode 100644 paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/MinorCompactActionITCase.java diff --git a/docs/content/flink/procedures.md b/docs/content/flink/procedures.md index 7e669a89d43bf..59b02f82bf8c0 100644 --- a/docs/content/flink/procedures.md +++ b/docs/content/flink/procedures.md @@ -67,7 +67,8 @@ All available procedures are listed below. order_by => 'order_by', options => 'options', `where` => 'where', - partition_idle_time => 'partition_idle_time')

+ partition_idle_time => 'partition_idle_time', + compact_strategy => 'compact_strategy')

-- Use indexed argument
CALL [catalog.]sys.compact('table')

CALL [catalog.]sys.compact('table', 'partitions')

@@ -76,6 +77,7 @@ All available procedures are listed below. CALL [catalog.]sys.compact('table', 'partitions', 'order_strategy', 'order_by', 'options')

CALL [catalog.]sys.compact('table', 'partitions', 'order_strategy', 'order_by', 'options', 'where')

CALL [catalog.]sys.compact('table', 'partitions', 'order_strategy', 'order_by', 'options', 'where', 'partition_idle_time')

+ CALL [catalog.]sys.compact('table', 'partitions', 'order_strategy', 'order_by', 'options', 'where', 'partition_idle_time', 'compact_strategy')
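As an illustrative sketch of the positional form (the table name is an assumption; unused arguments are left empty and the strategy is passed last):

```sql
-- partitions, order, options, where and partition_idle_time left empty;
-- only the trailing compact_strategy argument is set.
CALL sys.compact('default.T', '', '', '', '', '', '', 'minor')
```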

To compact a table. Arguments: @@ -86,6 +88,7 @@ All available procedures are listed below.

  • options(optional): additional dynamic options of the table.
  • where(optional): partition predicate (can't be used together with "partitions"). Note: as where is a keyword, a pair of backticks needs to be added around it, like `where`.
  • partition_idle_time(optional): this is used to do a full compaction for partitions that have not received any new data for 'partition_idle_time'. Only these partitions will be compacted. This argument cannot be used with order compact.
  • + compact_strategy(optional): this determines how to pick files to be merged; the default is determined by the runtime execution mode. The 'full' strategy only supports batch mode and selects all files for merging. The 'minor' strategy picks only the files that need to be merged based on specified conditions (see the example below).
  • -- use partition filter
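For instance, a batch call that combines the new strategy argument with an explicit compaction trigger could look like the following sketch (the table name and option value are illustrative):

```sql
-- 'minor' only rewrites buckets whose sorted runs exceed the configured trigger,
-- while 'full' would rewrite every file and is restricted to batch mode.
CALL sys.compact(`table` => 'default.T', compact_strategy => 'minor', options => 'num-sorted-run.compaction-trigger=3')
```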
    @@ -104,7 +107,8 @@ All available procedures are listed below. including_tables => 'includingTables', excluding_tables => 'excludingTables', table_options => 'tableOptions', - partition_idle_time => 'partitionIdleTime')

    + partition_idle_time => 'partitionIdleTime', + compact_strategy => 'compact_strategy')

    -- Use indexed argument
    CALL [catalog.]sys.compact_database()

    CALL [catalog.]sys.compact_database('includingDatabases')

    @@ -112,7 +116,8 @@ All available procedures are listed below. CALL [catalog.]sys.compact_database('includingDatabases', 'mode', 'includingTables')

    CALL [catalog.]sys.compact_database('includingDatabases', 'mode', 'includingTables', 'excludingTables')

    CALL [catalog.]sys.compact_database('includingDatabases', 'mode', 'includingTables', 'excludingTables', 'tableOptions')

    - CALL [catalog.]sys.compact_database('includingDatabases', 'mode', 'includingTables', 'excludingTables', 'tableOptions', 'partitionIdleTime') + CALL [catalog.]sys.compact_database('includingDatabases', 'mode', 'includingTables', 'excludingTables', 'tableOptions', 'partitionIdleTime')

    + CALL [catalog.]sys.compact_database('includingDatabases', 'mode', 'includingTables', 'excludingTables', 'tableOptions', 'partitionIdleTime', 'compact_strategy')
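A sketch of the positional form with the new trailing argument (database pattern, mode, table patterns and option values are assumptions):

```sql
-- Positional arguments follow the signature above; partitionIdleTime is left empty
-- and the last argument selects the strategy.
CALL sys.compact_database('db1', 'combined', 'table_.*', 'ignore', 'sink.parallelism=4', '', 'full')
```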

    To compact databases. Arguments: @@ -124,6 +129,7 @@ All available procedures are listed below.
  • excludingTables: to specify tables that are not compacted. You can use regular expression.
  • tableOptions: additional dynamic options of the table.
  • partition_idle_time: this is used to do a full compaction for partitions that have not received any new data for 'partition_idle_time'. Only these partitions will be compacted.
  • + compact_strategy(optional): this determines how to pick files to be merged; the default is determined by the runtime execution mode. The 'full' strategy only supports batch mode and selects all files for merging. The 'minor' strategy picks only the files that need to be merged based on specified conditions.
  • CALL sys.compact_database( @@ -131,7 +137,8 @@ All available procedures are listed below. mode => 'combined', including_tables => 'table_.*', excluding_tables => 'ignore', - table_options => 'sink.parallelism=4') + table_options => 'sink.parallelism=4', + compact_strategy => 'full') diff --git a/docs/content/maintenance/dedicated-compaction.md b/docs/content/maintenance/dedicated-compaction.md index c0010bf9cc854..63e0aa5e66e4b 100644 --- a/docs/content/maintenance/dedicated-compaction.md +++ b/docs/content/maintenance/dedicated-compaction.md @@ -107,6 +107,7 @@ Run the following command to submit a compaction job for the table. --database \ --table \ [--partition ] \ + [--compact_strategy ] \ [--table_conf ] \ [--catalog_conf [--catalog_conf ...]] ``` @@ -123,10 +124,14 @@ Example: compact table --partition dt=20221126,hh=08 \ --partition dt=20221127,hh=09 \ --table_conf sink.parallelism=10 \ + --compact_strategy minor \ --catalog_conf s3.endpoint=https://****.com \ --catalog_conf s3.access-key=***** \ --catalog_conf s3.secret-key=***** ``` +* `--compact_strategy` Determines how to pick files to be merged; the default is determined by the runtime execution mode: streaming mode uses the `minor` strategy and batch mode uses the `full` strategy. + * `full` : Only supports batch mode. All files will be selected for merging. + * `minor` : Pick the set of files that need to be merged based on specified conditions. You can use `-D execution.runtime-mode=batch` or `-yD execution.runtime-mode=batch` (for the ON-YARN scenario) to control batch or streaming mode. If you submit a batch job, all current table files will be compacted. If you submit a streaming job, the job will continuously monitor new changes @@ -190,6 +195,7 @@ CALL sys.compact_database( [--including_tables ] \ [--excluding_tables ] \ [--mode ] \ + [--compact_strategy ] \ [--catalog_conf [--catalog_conf ...]] \ [--table_conf [--table_conf ...]] ``` @@ -346,6 +352,7 @@ CALL sys.compact(`table` => 'default.T', 'partition_idle_time' => '1 d') --table \ --partition_idle_time \ [--partition ] \ + [--compact_strategy ] \ [--catalog_conf [--catalog_conf ...]] \ [--table_conf [--table_conf ] ...] ``` @@ -406,6 +413,7 @@ CALL sys.compact_database( [--including_tables ] \ [--excluding_tables ] \ [--mode ] \ + [--compact_strategy ] \ [--catalog_conf [--catalog_conf ...]] \ [--table_conf [--table_conf ...]] ``` diff --git a/docs/content/spark/procedures.md b/docs/content/spark/procedures.md index 1f3f554106ec5..88d46fabbb2bc 100644 --- a/docs/content/spark/procedures.md +++ b/docs/content/spark/procedures.md @@ -47,12 +47,14 @@ This section introduce all available spark procedures about paimon.
  • order_strategy: 'order' or 'zorder' or 'hilbert' or 'none'. Left empty for 'none'.
  • order_columns: the columns that need to be sorted. Left empty if 'order_strategy' is 'none'.
  • partition_idle_time: this is used to do a full compaction for partitions that have not received any new data for 'partition_idle_time'. Only these partitions will be compacted. This argument cannot be used with order compact.
  • + compact_strategy: this determines how to pick files to be merged; the default is determined by the runtime execution mode. The 'full' strategy only supports batch mode and selects all files for merging. The 'minor' strategy picks only the files that need to be merged based on specified conditions (see the combined example after the call samples below).
  • SET spark.sql.shuffle.partitions=10; --set the compact parallelism

    CALL sys.compact(table => 'T', partitions => 'p=0;p=1', order_strategy => 'zorder', order_by => 'a,b')

    CALL sys.compact(table => 'T', where => 'p>0 and p<3', order_strategy => 'zorder', order_by => 'a,b')

    - CALL sys.compact(table => 'T', partition_idle_time => '60s') + CALL sys.compact(table => 'T', partition_idle_time => '60s')

    + CALL sys.compact(table => 'T', compact_strategy => 'minor')
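And, as a sketch of combining the strategy with a partition filter (the partition value is an assumption; the two arguments are optional and independent):

```sql
-- Minor compaction limited to a single partition.
CALL sys.compact(table => 'T', partitions => 'p=0', compact_strategy => 'minor')
```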

    diff --git a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/CompactDatabaseProcedure.java b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/CompactDatabaseProcedure.java index 99f205bacb58e..ac4340c113365 100644 --- a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/CompactDatabaseProcedure.java +++ b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/CompactDatabaseProcedure.java @@ -26,6 +26,8 @@ import java.util.Map; +import static org.apache.paimon.flink.action.ActionFactory.FULL; +import static org.apache.paimon.flink.action.CompactActionFactory.checkCompactStrategy; import static org.apache.paimon.utils.ParameterUtils.parseCommaSeparatedKeyValues; /** @@ -51,6 +53,7 @@ * * -- set table options ('k=v,...') * CALL sys.compact_database('includingDatabases', 'mode', 'includingTables', 'excludingTables', 'tableOptions') + * * */ public class CompactDatabaseProcedure extends ProcedureBase { @@ -106,7 +109,8 @@ public String[] call( includingTables, excludingTables, tableOptions, - ""); + "", + null); } public String[] call( @@ -116,7 +120,8 @@ public String[] call( String includingTables, String excludingTables, String tableOptions, - String partitionIdleTime) + String partitionIdleTime, + String compactStrategy) throws Exception { String warehouse = catalog.warehouse(); Map catalogOptions = catalog.options(); @@ -133,6 +138,10 @@ public String[] call( action.withPartitionIdleTime(TimeUtils.parseDuration(partitionIdleTime)); } + if (checkCompactStrategy(compactStrategy)) { + action.withFullCompaction(compactStrategy.trim().equalsIgnoreCase(FULL)); + } + return execute(procedureContext, action, "Compact database job"); } diff --git a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/CompactProcedure.java b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/CompactProcedure.java index 63aa6c906b947..560e532a6dbb3 100644 --- a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/CompactProcedure.java +++ b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/paimon/flink/procedure/CompactProcedure.java @@ -31,6 +31,9 @@ import java.util.Collections; import java.util.Map; +import static org.apache.paimon.flink.action.ActionFactory.FULL; +import static org.apache.paimon.flink.action.CompactActionFactory.checkCompactStrategy; + /** * Stay compatible with 1.18 procedure which doesn't support named argument. 
Usage: * @@ -49,6 +52,9 @@ * -- compact specific partitions with sorting * CALL sys.compact('tableId', 'partitions', 'ORDER/ZORDER', 'col1,col2', 'sink.parallelism=6') * + * -- compact with specific compact strategy + * CALL sys.compact('tableId', 'partitions', 'ORDER/ZORDER', 'col1,col2', 'sink.parallelism=6', 'minor') + * * */ public class CompactProcedure extends ProcedureBase { @@ -118,7 +124,8 @@ public String[] call( orderByColumns, tableOptions, whereSql, - ""); + "", + null); } public String[] call( @@ -129,7 +136,8 @@ public String[] call( String orderByColumns, String tableOptions, String whereSql, - String partitionIdleTime) + String partitionIdleTime, + String compactStrategy) throws Exception { String warehouse = catalog.warehouse(); @@ -152,6 +160,10 @@ public String[] call( if (!(StringUtils.isNullOrWhitespaceOnly(partitionIdleTime))) { action.withPartitionIdleTime(TimeUtils.parseDuration(partitionIdleTime)); } + + if (checkCompactStrategy(compactStrategy)) { + action.withFullCompaction(compactStrategy.trim().equalsIgnoreCase(FULL)); + } jobName = "Compact Job"; } else if (!orderStrategy.isEmpty() && !orderByColumns.isEmpty()) { Preconditions.checkArgument( diff --git a/paimon-flink/paimon-flink-1.18/src/test/java/org/apache/paimon/flink/procedure/ProcedurePositionalArgumentsITCase.java b/paimon-flink/paimon-flink-1.18/src/test/java/org/apache/paimon/flink/procedure/ProcedurePositionalArgumentsITCase.java index f2385e66d2a1d..f79d6fb716b4c 100644 --- a/paimon-flink/paimon-flink-1.18/src/test/java/org/apache/paimon/flink/procedure/ProcedurePositionalArgumentsITCase.java +++ b/paimon-flink/paimon-flink-1.18/src/test/java/org/apache/paimon/flink/procedure/ProcedurePositionalArgumentsITCase.java @@ -68,10 +68,16 @@ public void testCompactDatabaseAndTable() { sql( "CALL sys.compact('default.T', '', '', '', 'sink.parallelism=1','pt=1')")) .doesNotThrowAnyException(); - assertThatCode(() -> sql("CALL sys.compact('default.T', '', 'zorder', 'k', '','','5s')")) + assertThatCode( + () -> + sql( + "CALL sys.compact('default.T', '' ,'zorder', 'k', '','','5s', '')")) .message() .contains("sort compact do not support 'partition_idle_time'."); + assertThatCode(() -> sql("CALL sys.compact('default.T', '', '' ,'', '', '', '', 'full')")) + .doesNotThrowAnyException(); + assertThatCode(() -> sql("CALL sys.compact_database('default')")) .doesNotThrowAnyException(); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/ActionFactory.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/ActionFactory.java index 43719f715d9de..fbf8f12f49eb6 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/ActionFactory.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/ActionFactory.java @@ -58,6 +58,10 @@ public interface ActionFactory extends Factory { String TIMESTAMPFORMATTER = "timestamp_formatter"; String EXPIRE_STRATEGY = "expire_strategy"; String TIMESTAMP_PATTERN = "timestamp_pattern"; + // Supports `full` and `minor`. 
+ String COMPACT_STRATEGY = "compact_strategy"; + String MINOR = "minor"; + String FULL = "full"; Optional create(MultipleParameterToolAdapter params); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactAction.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactAction.java index ce88857f1b141..84e37a5b10f9c 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactAction.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactAction.java @@ -59,6 +59,8 @@ public class CompactAction extends TableActionBase { @Nullable private Duration partitionIdleTime = null; + private Boolean fullCompaction; + public CompactAction(String warehouse, String database, String tableName) { this(warehouse, database, tableName, Collections.emptyMap(), Collections.emptyMap()); } @@ -100,6 +102,11 @@ public CompactAction withPartitionIdleTime(@Nullable Duration partitionIdleTime) return this; } + public CompactAction withFullCompaction(Boolean fullCompaction) { + this.fullCompaction = fullCompaction; + return this; + } + @Override public void build() throws Exception { ReadableConfig conf = env.getConfiguration(); @@ -124,6 +131,13 @@ public void build() throws Exception { private void buildForTraditionalCompaction( StreamExecutionEnvironment env, FileStoreTable table, boolean isStreaming) throws Exception { + if (fullCompaction == null) { + fullCompaction = !isStreaming; + } else { + Preconditions.checkArgument( + !(fullCompaction && isStreaming), + "The full compact strategy is only supported in batch mode. Please add -Dexecution.runtime-mode=BATCH."); + } if (isStreaming) { // for completely asynchronous compaction HashMap dynamicOptions = @@ -138,8 +152,7 @@ private void buildForTraditionalCompaction( } CompactorSourceBuilder sourceBuilder = new CompactorSourceBuilder(identifier.getFullName(), table); - CompactorSinkBuilder sinkBuilder = - new CompactorSinkBuilder(table).withFullCompaction(!isStreaming); + CompactorSinkBuilder sinkBuilder = new CompactorSinkBuilder(table, fullCompaction); sourceBuilder.withPartitionPredicate(getPredicate()); DataStreamSource source = diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactActionFactory.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactActionFactory.java index f43c7a747c990..fc60a870eabe1 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactActionFactory.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactActionFactory.java @@ -76,6 +76,10 @@ public Optional create(MultipleParameterToolAdapter params) { action.withPartitionIdleTime( TimeUtils.parseDuration(params.get(PARTITION_IDLE_TIME))); } + String compactStrategy = params.get(COMPACT_STRATEGY); + if (checkCompactStrategy(compactStrategy)) { + action.withFullCompaction(compactStrategy.trim().equalsIgnoreCase(FULL)); + } } if (params.has(PARTITION)) { @@ -88,6 +92,19 @@ public Optional create(MultipleParameterToolAdapter params) { return Optional.of(action); } + public static boolean checkCompactStrategy(String compactStrategy) { + if (compactStrategy != null) { + Preconditions.checkArgument( + compactStrategy.equalsIgnoreCase(MINOR) + || compactStrategy.equalsIgnoreCase(FULL), + String.format( + "The compact strategy only supports 'full' or 'minor', but '%s' is configured.", 
+ compactStrategy)); + return true; + } + return false; + } + @Override public void printHelp() { System.out.println( @@ -101,7 +118,8 @@ public void printHelp() { + "[--order_strategy ]" + "[--table_conf =]" + "[--order_by ]" - + "[--partition_idle_time ]"); + + "[--partition_idle_time ]" + + "[--compact_strategy ]"); System.out.println( " compact --warehouse s3://path/to/warehouse --database " + "--table [--catalog_conf [--catalog_conf ...]]"); @@ -132,6 +150,10 @@ public void printHelp() { System.out.println( " compact --warehouse hdfs:///path/to/warehouse --database test_db --table test_table " + "--partition_idle_time 10s"); + System.out.println( + "--compact_strategy determines how to pick files to be merged, the default is determined by the runtime execution mode. " + + "`full` : Only supports batch mode. All files will be selected for merging." + + "`minor`: Pick the set of files that need to be merged based on specified conditions."); System.out.println( " compact --warehouse s3:///path/to/warehouse " + "--database test_db " diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactDatabaseAction.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactDatabaseAction.java index 471c6fdd4da69..124d3ca687761 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactDatabaseAction.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactDatabaseAction.java @@ -72,6 +72,10 @@ public class CompactDatabaseAction extends ActionBase { @Nullable private Duration partitionIdleTime = null; + private Boolean fullCompaction; + + private boolean isStreaming; + public CompactDatabaseAction(String warehouse, Map catalogConfig) { super(warehouse, catalogConfig); } @@ -110,6 +114,11 @@ public CompactDatabaseAction withPartitionIdleTime(@Nullable Duration partitionI return this; } + public CompactDatabaseAction withFullCompaction(boolean fullCompaction) { + this.fullCompaction = fullCompaction; + return this; + } + private boolean shouldCompactionTable(String paimonFullTableName) { boolean shouldCompaction = includingPattern.matcher(paimonFullTableName).matches(); if (excludingPattern != null) { @@ -124,6 +133,12 @@ private boolean shouldCompactionTable(String paimonFullTableName) { @Override public void build() { + ReadableConfig conf = env.getConfiguration(); + isStreaming = conf.get(ExecutionOptions.RUNTIME_MODE) == RuntimeExecutionMode.STREAMING; + + if (fullCompaction == null) { + fullCompaction = !isStreaming; + } if (databaseCompactMode == MultiTablesSinkMode.DIVIDED) { buildForDividedMode(); } else { @@ -170,24 +185,19 @@ private void buildForDividedMode() { !tableMap.isEmpty(), "no tables to be compacted. 
possible cause is that there are no tables detected after pattern matching"); - ReadableConfig conf = env.getConfiguration(); - boolean isStreaming = - conf.get(ExecutionOptions.RUNTIME_MODE) == RuntimeExecutionMode.STREAMING; for (Map.Entry entry : tableMap.entrySet()) { FileStoreTable fileStoreTable = entry.getValue(); switch (fileStoreTable.bucketMode()) { case BUCKET_UNAWARE: { - buildForUnawareBucketCompaction( - env, entry.getKey(), fileStoreTable, isStreaming); + buildForUnawareBucketCompaction(env, entry.getKey(), fileStoreTable); break; } case HASH_FIXED: case HASH_DYNAMIC: default: { - buildForTraditionalCompaction( - env, entry.getKey(), fileStoreTable, isStreaming); + buildForTraditionalCompaction(env, entry.getKey(), fileStoreTable); } } } @@ -195,9 +205,6 @@ private void buildForDividedMode() { private void buildForCombinedMode() { - ReadableConfig conf = env.getConfiguration(); - boolean isStreaming = - conf.get(ExecutionOptions.RUNTIME_MODE) == RuntimeExecutionMode.STREAMING; CombinedTableCompactorSourceBuilder sourceBuilder = new CombinedTableCompactorSourceBuilder( catalogLoader(), @@ -234,15 +241,17 @@ private void buildForCombinedMode() { .buildForUnawareBucketsTableSource(), parallelism); - new CombinedTableCompactorSink(catalogLoader(), tableOptions) + new CombinedTableCompactorSink(catalogLoader(), tableOptions, fullCompaction) .sinkFrom(awareBucketTableSource, unawareBucketTableSource); } private void buildForTraditionalCompaction( - StreamExecutionEnvironment env, - String fullName, - FileStoreTable table, - boolean isStreaming) { + StreamExecutionEnvironment env, String fullName, FileStoreTable table) { + + Preconditions.checkArgument( + !(fullCompaction && isStreaming), + "The full compact strategy is only supported in batch mode. Please add -Dexecution.runtime-mode=BATCH."); + if (isStreaming) { // for completely asynchronous compaction HashMap dynamicOptions = @@ -259,8 +268,7 @@ private void buildForTraditionalCompaction( CompactorSourceBuilder sourceBuilder = new CompactorSourceBuilder(fullName, table) .withPartitionIdleTime(partitionIdleTime); - CompactorSinkBuilder sinkBuilder = - new CompactorSinkBuilder(table).withFullCompaction(!isStreaming); + CompactorSinkBuilder sinkBuilder = new CompactorSinkBuilder(table, fullCompaction); DataStreamSource source = sourceBuilder.withEnv(env).withContinuousMode(isStreaming).build(); @@ -268,10 +276,7 @@ private void buildForTraditionalCompaction( } private void buildForUnawareBucketCompaction( - StreamExecutionEnvironment env, - String fullName, - FileStoreTable table, - boolean isStreaming) { + StreamExecutionEnvironment env, String fullName, FileStoreTable table) { UnawareBucketCompactionTopoBuilder unawareBucketCompactionTopoBuilder = new UnawareBucketCompactionTopoBuilder(env, fullName, table); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactDatabaseActionFactory.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactDatabaseActionFactory.java index b268709078093..5672f99dc30f3 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactDatabaseActionFactory.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CompactDatabaseActionFactory.java @@ -22,6 +22,8 @@ import java.util.Optional; +import static org.apache.paimon.flink.action.CompactActionFactory.checkCompactStrategy; + /** Factory to create {@link CompactDatabaseAction}. 
*/ public class CompactDatabaseActionFactory implements ActionFactory { @@ -55,6 +57,11 @@ public Optional create(MultipleParameterToolAdapter params) { action.withPartitionIdleTime(TimeUtils.parseDuration(partitionIdleTime)); } + String compactStrategy = params.get(COMPACT_STRATEGY); + if (checkCompactStrategy(compactStrategy)) { + action.withFullCompaction(compactStrategy.trim().equalsIgnoreCase(FULL)); + } + return Optional.of(action); } @@ -70,7 +77,8 @@ public void printHelp() { + "[--including_tables ] " + "[--excluding_tables ] " + "[--mode ]" - + "[--partition_idle_time ]"); + + "[--partition_idle_time ]" + + "[--compact_strategy ]"); System.out.println( " compact_database --warehouse s3://path/to/warehouse --including_databases " + "[--catalog_conf [--catalog_conf ...]]"); @@ -93,6 +101,11 @@ public void printHelp() { System.out.println( "--partition_idle_time is used to do a full compaction for partition which had not receive any new data for 'partition_idle_time' time. And only these partitions will be compacted."); System.out.println("--partition_idle_time is only supported in batch mode. "); + System.out.println( + "--compact_strategy determines how to pick files to be merged, the default is determined by the runtime execution mode. " + + "`full` : Only supports batch mode. All files will be selected for merging." + + "`minor`: Pick the set of files that need to be merged based on specified conditions."); + System.out.println(); System.out.println("Examples:"); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/CompactDatabaseProcedure.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/CompactDatabaseProcedure.java index dd71e974c7b16..80602b755aa59 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/CompactDatabaseProcedure.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/CompactDatabaseProcedure.java @@ -29,6 +29,8 @@ import java.util.Map; +import static org.apache.paimon.flink.action.ActionFactory.FULL; +import static org.apache.paimon.flink.action.CompactActionFactory.checkCompactStrategy; import static org.apache.paimon.utils.ParameterUtils.parseCommaSeparatedKeyValues; /** @@ -82,6 +84,10 @@ public class CompactDatabaseProcedure extends ProcedureBase { @ArgumentHint( name = "partition_idle_time", type = @DataTypeHint("STRING"), + isOptional = true), + @ArgumentHint( + name = "compact_strategy", + type = @DataTypeHint("STRING"), isOptional = true) }) public String[] call( @@ -91,7 +97,8 @@ public String[] call( String includingTables, String excludingTables, String tableOptions, - String partitionIdleTime) + String partitionIdleTime, + String compactStrategy) throws Exception { partitionIdleTime = notnull(partitionIdleTime); String warehouse = catalog.warehouse(); @@ -109,6 +116,10 @@ public String[] call( action.withPartitionIdleTime(TimeUtils.parseDuration(partitionIdleTime)); } + if (checkCompactStrategy(compactStrategy)) { + action.withFullCompaction(compactStrategy.trim().equalsIgnoreCase(FULL)); + } + return execute(procedureContext, action, "Compact database job"); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/CompactProcedure.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/CompactProcedure.java index 8589069126988..282f5af340432 100644 --- 
a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/CompactProcedure.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/procedure/CompactProcedure.java @@ -32,6 +32,8 @@ import java.util.Collections; import java.util.Map; +import static org.apache.paimon.flink.action.ActionFactory.FULL; +import static org.apache.paimon.flink.action.CompactActionFactory.checkCompactStrategy; import static org.apache.paimon.utils.ParameterUtils.getPartitions; import static org.apache.paimon.utils.ParameterUtils.parseCommaSeparatedKeyValues; import static org.apache.paimon.utils.StringUtils.isNullOrWhitespaceOnly; @@ -58,6 +60,10 @@ public class CompactProcedure extends ProcedureBase { @ArgumentHint( name = "partition_idle_time", type = @DataTypeHint("STRING"), + isOptional = true), + @ArgumentHint( + name = "compact_strategy", + type = @DataTypeHint("STRING"), isOptional = true) }) public String[] call( @@ -68,7 +74,8 @@ public String[] call( String orderByColumns, String tableOptions, String where, - String partitionIdleTime) + String partitionIdleTime, + String compactStrategy) throws Exception { String warehouse = catalog.warehouse(); Map catalogOptions = catalog.options(); @@ -90,6 +97,10 @@ public String[] call( if (!isNullOrWhitespaceOnly(partitionIdleTime)) { action.withPartitionIdleTime(TimeUtils.parseDuration(partitionIdleTime)); } + + if (checkCompactStrategy(compactStrategy)) { + action.withFullCompaction(compactStrategy.trim().equalsIgnoreCase(FULL)); + } jobName = "Compact Job"; } else if (!isNullOrWhitespaceOnly(orderStrategy) && !isNullOrWhitespaceOnly(orderByColumns)) { diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java index 87a28091fa302..ce4e37305909a 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java @@ -57,11 +57,15 @@ public class CombinedTableCompactorSink implements Serializable { private final Catalog.Loader catalogLoader; private final boolean ignorePreviousFiles; + private final boolean fullCompaction; + private final Options options; - public CombinedTableCompactorSink(Catalog.Loader catalogLoader, Options options) { + public CombinedTableCompactorSink( + Catalog.Loader catalogLoader, Options options, boolean fullCompaction) { this.catalogLoader = catalogLoader; this.ignorePreviousFiles = false; + this.fullCompaction = fullCompaction; this.options = options; } @@ -104,7 +108,10 @@ public DataStream doWrite( String.format("%s-%s", "Multi-Bucket-Table", WRITER_NAME), new MultiTableCommittableTypeInfo(), combinedMultiComacptionWriteOperator( - env.getCheckpointConfig(), isStreaming, commitUser)) + env.getCheckpointConfig(), + isStreaming, + fullCompaction, + commitUser)) .setParallelism(awareBucketTableSource.getParallelism()); SingleOutputStreamOperator unawareBucketTableRewriter = @@ -168,13 +175,17 @@ protected DataStreamSink doCommit( // TODO:refactor FlinkSink to adopt this sink protected OneInputStreamOperator combinedMultiComacptionWriteOperator( - CheckpointConfig checkpointConfig, boolean isStreaming, String commitUser) { + CheckpointConfig checkpointConfig, + boolean isStreaming, + boolean fullCompaction, + String commitUser) { return new 
MultiTablesStoreCompactOperator( catalogLoader, commitUser, checkpointConfig, isStreaming, ignorePreviousFiles, + fullCompaction, options); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactorSinkBuilder.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactorSinkBuilder.java index 2173b1d34a72e..2d84ae6726fd2 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactorSinkBuilder.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactorSinkBuilder.java @@ -37,10 +37,11 @@ public class CompactorSinkBuilder { private DataStream input; - private boolean fullCompaction; + private final boolean fullCompaction; - public CompactorSinkBuilder(FileStoreTable table) { + public CompactorSinkBuilder(FileStoreTable table, boolean fullCompaction) { this.table = table; + this.fullCompaction = fullCompaction; } public CompactorSinkBuilder withInput(DataStream input) { @@ -48,11 +49,6 @@ public CompactorSinkBuilder withInput(DataStream input) { return this; } - public CompactorSinkBuilder withFullCompaction(boolean fullCompaction) { - this.fullCompaction = fullCompaction; - return this; - } - public DataStreamSink build() { BucketMode bucketMode = table.bucketMode(); switch (bucketMode) { diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java index 8a1d3a02df811..57d2e8413cb5b 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java @@ -63,6 +63,7 @@ public class MultiTablesStoreCompactOperator private final CheckpointConfig checkpointConfig; private final boolean isStreaming; private final boolean ignorePreviousFiles; + private final boolean fullCompaction; private final String initialCommitUser; private transient StoreSinkWriteState state; @@ -81,6 +82,7 @@ public MultiTablesStoreCompactOperator( CheckpointConfig checkpointConfig, boolean isStreaming, boolean ignorePreviousFiles, + boolean fullCompaction, Options options) { super(options); this.catalogLoader = catalogLoader; @@ -88,6 +90,7 @@ public MultiTablesStoreCompactOperator( this.checkpointConfig = checkpointConfig; this.isStreaming = isStreaming; this.ignorePreviousFiles = ignorePreviousFiles; + this.fullCompaction = fullCompaction; } @Override @@ -162,13 +165,14 @@ public void processElement(StreamRecord element) throws Exception { if (write.streamingMode()) { write.notifyNewFiles(snapshotId, partition, bucket, files); + // The full compact is not supported in streaming mode. write.compact(partition, bucket, false); } else { Preconditions.checkArgument( files.isEmpty(), "Batch compact job does not concern what files are compacted. 
" + "They only need to know what buckets are compacted."); - write.compact(partition, bucket, true); + write.compact(partition, bucket, fullCompaction); } } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CompactActionITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CompactActionITCase.java index bc849f0a135ff..2c4fb64f331c3 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CompactActionITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CompactActionITCase.java @@ -23,13 +23,9 @@ import org.apache.paimon.data.BinaryString; import org.apache.paimon.flink.FlinkConnectorOptions; import org.apache.paimon.table.FileStoreTable; -import org.apache.paimon.table.sink.StreamWriteBuilder; import org.apache.paimon.table.source.DataSplit; import org.apache.paimon.table.source.StreamTableScan; import org.apache.paimon.table.source.TableScan; -import org.apache.paimon.types.DataType; -import org.apache.paimon.types.DataTypes; -import org.apache.paimon.types.RowType; import org.apache.paimon.utils.CommonTestUtils; import org.apache.paimon.utils.SnapshotManager; @@ -56,12 +52,6 @@ /** IT cases for {@link CompactAction}. */ public class CompactActionITCase extends CompactActionITCaseBase { - private static final DataType[] FIELD_TYPES = - new DataType[] {DataTypes.INT(), DataTypes.INT(), DataTypes.INT(), DataTypes.STRING()}; - - private static final RowType ROW_TYPE = - RowType.of(FIELD_TYPES, new String[] {"k", "v", "hh", "dt"}); - @Test @Timeout(60) public void testBatchCompact() throws Exception { @@ -402,31 +392,6 @@ public void testWrongUsage() throws Exception { .hasMessage("sort compact do not support 'partition_idle_time'."); } - private FileStoreTable prepareTable( - List partitionKeys, - List primaryKeys, - List bucketKey, - Map tableOptions) - throws Exception { - FileStoreTable table = - createFileStoreTable(ROW_TYPE, partitionKeys, primaryKeys, bucketKey, tableOptions); - - StreamWriteBuilder streamWriteBuilder = - table.newStreamWriteBuilder().withCommitUser(commitUser); - write = streamWriteBuilder.newWrite(); - commit = streamWriteBuilder.newCommit(); - - return table; - } - - private void checkLatestSnapshot( - FileStoreTable table, long snapshotId, Snapshot.CommitKind commitKind) { - SnapshotManager snapshotManager = table.snapshotManager(); - Snapshot snapshot = snapshotManager.snapshot(snapshotManager.latestSnapshotId()); - assertThat(snapshot.id()).isEqualTo(snapshotId); - assertThat(snapshot.commitKind()).isEqualTo(commitKind); - } - private void runAction(boolean isStreaming) throws Exception { runAction(isStreaming, false); } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CompactActionITCaseBase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CompactActionITCaseBase.java index 4c646444cb72c..41d01bdf7f35e 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CompactActionITCaseBase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CompactActionITCaseBase.java @@ -18,17 +18,22 @@ package org.apache.paimon.flink.action; +import org.apache.paimon.Snapshot; import org.apache.paimon.manifest.FileKind; import org.apache.paimon.manifest.ManifestEntry; import org.apache.paimon.operation.FileStoreScan; import org.apache.paimon.table.FileStoreTable; +import 
org.apache.paimon.table.sink.StreamWriteBuilder; import org.apache.paimon.table.source.StreamTableScan; import org.apache.paimon.table.source.TableScan; +import org.apache.paimon.types.DataType; +import org.apache.paimon.types.DataTypes; import org.apache.paimon.types.RowType; import org.apache.paimon.utils.SnapshotManager; import java.util.ArrayList; import java.util.List; +import java.util.Map; import java.util.Objects; import java.util.concurrent.TimeoutException; @@ -37,6 +42,12 @@ /** Base IT cases for {@link CompactAction} and {@link CompactDatabaseAction} . */ public class CompactActionITCaseBase extends ActionITCaseBase { + protected static final DataType[] FIELD_TYPES = + new DataType[] {DataTypes.INT(), DataTypes.INT(), DataTypes.INT(), DataTypes.STRING()}; + + protected static final RowType ROW_TYPE = + RowType.of(FIELD_TYPES, new String[] {"k", "v", "hh", "dt"}); + protected void validateResult( FileStoreTable table, RowType rowType, @@ -87,4 +98,29 @@ protected void checkFileAndRowSize( assertThat(files.size()).isEqualTo(fileNum); assertThat(count).isEqualTo(rowCount); } + + protected void checkLatestSnapshot( + FileStoreTable table, long snapshotId, Snapshot.CommitKind commitKind) { + SnapshotManager snapshotManager = table.snapshotManager(); + Snapshot snapshot = snapshotManager.snapshot(snapshotManager.latestSnapshotId()); + assertThat(snapshot.id()).isEqualTo(snapshotId); + assertThat(snapshot.commitKind()).isEqualTo(commitKind); + } + + protected FileStoreTable prepareTable( + List partitionKeys, + List primaryKeys, + List bucketKey, + Map tableOptions) + throws Exception { + FileStoreTable table = + createFileStoreTable(ROW_TYPE, partitionKeys, primaryKeys, bucketKey, tableOptions); + + StreamWriteBuilder streamWriteBuilder = + table.newStreamWriteBuilder().withCommitUser(commitUser); + write = streamWriteBuilder.newWrite(); + commit = streamWriteBuilder.newCommit(); + + return table; + } } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/MinorCompactActionITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/MinorCompactActionITCase.java new file mode 100644 index 0000000000000..0373eb01a2d92 --- /dev/null +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/MinorCompactActionITCase.java @@ -0,0 +1,205 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.flink.action; + +import org.apache.paimon.CoreOptions; +import org.apache.paimon.Snapshot; +import org.apache.paimon.data.BinaryString; +import org.apache.paimon.table.FileStoreTable; +import org.apache.paimon.table.source.DataSplit; + +import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; +import org.assertj.core.api.Assertions; +import org.junit.jupiter.api.Test; +import org.junit.jupiter.api.Timeout; + +import java.util.Arrays; +import java.util.Collections; +import java.util.List; + +import static org.assertj.core.api.Assertions.assertThat; + +/** IT cases for compact strategy {@link CompactAction}. */ +public class MinorCompactActionITCase extends CompactActionITCaseBase { + + @Test + @Timeout(60) + public void testBatchMinorCompactStrategy() throws Exception { + FileStoreTable table = + prepareTable( + Arrays.asList("dt", "hh"), + Arrays.asList("dt", "hh", "k"), + Collections.emptyList(), + Collections.singletonMap(CoreOptions.WRITE_ONLY.key(), "true")); + + writeData( + rowData(1, 100, 15, BinaryString.fromString("20221208")), + rowData(1, 100, 16, BinaryString.fromString("20221208"))); + + writeData( + rowData(2, 100, 15, BinaryString.fromString("20221208")), + rowData(2, 100, 16, BinaryString.fromString("20221208"))); + + checkLatestSnapshot(table, 2, Snapshot.CommitKind.APPEND); + + CompactAction action = + createAction( + CompactAction.class, + "compact", + "--warehouse", + warehouse, + "--database", + database, + "--table", + tableName, + "--compact_strategy", + "minor", + "--table_conf", + CoreOptions.NUM_SORTED_RUNS_COMPACTION_TRIGGER.key() + "=3"); + StreamExecutionEnvironment env = streamExecutionEnvironmentBuilder().batchMode().build(); + action.withStreamExecutionEnvironment(env).build(); + env.execute(); + + // Due to the limitation of parameter 'num-sorted-run.compaction-trigger', so compact is not + // performed. + checkLatestSnapshot(table, 2, Snapshot.CommitKind.APPEND); + + // Make par-15 has 3 datafile and par-16 has 2 datafile, so par-16 will not be picked out to + // compact. + writeData(rowData(2, 100, 15, BinaryString.fromString("20221208"))); + + env = streamExecutionEnvironmentBuilder().batchMode().build(); + action.withStreamExecutionEnvironment(env).build(); + env.execute(); + + checkLatestSnapshot(table, 4, Snapshot.CommitKind.COMPACT); + + List splits = table.newSnapshotReader().read().dataSplits(); + assertThat(splits.size()).isEqualTo(2); + for (DataSplit split : splits) { + // Par-16 is not compacted. + assertThat(split.dataFiles().size()) + .isEqualTo(split.partition().getInt(1) == 16 ? 
2 : 1); + } + } + + @Test + @Timeout(60) + public void testBatchFullCompactStrategy() throws Exception { + FileStoreTable table = + prepareTable( + Arrays.asList("dt", "hh"), + Arrays.asList("dt", "hh", "k"), + Collections.emptyList(), + Collections.singletonMap(CoreOptions.WRITE_ONLY.key(), "true")); + + writeData( + rowData(1, 100, 15, BinaryString.fromString("20221208")), + rowData(1, 100, 16, BinaryString.fromString("20221208"))); + + writeData( + rowData(2, 100, 15, BinaryString.fromString("20221208")), + rowData(2, 100, 16, BinaryString.fromString("20221208"))); + + checkLatestSnapshot(table, 2, Snapshot.CommitKind.APPEND); + + CompactAction action = + createAction( + CompactAction.class, + "compact", + "--warehouse", + warehouse, + "--database", + database, + "--table", + tableName, + "--compact_strategy", + "full", + "--table_conf", + CoreOptions.NUM_SORTED_RUNS_COMPACTION_TRIGGER.key() + "=3"); + StreamExecutionEnvironment env = streamExecutionEnvironmentBuilder().batchMode().build(); + action.withStreamExecutionEnvironment(env).build(); + env.execute(); + + checkLatestSnapshot(table, 3, Snapshot.CommitKind.COMPACT); + + List splits = table.newSnapshotReader().read().dataSplits(); + assertThat(splits.size()).isEqualTo(2); + for (DataSplit split : splits) { + assertThat(split.dataFiles().size()).isEqualTo(1); + } + } + + @Test + @Timeout(60) + public void testStreamingFullCompactStrategy() throws Exception { + prepareTable( + Arrays.asList("dt", "hh"), + Arrays.asList("dt", "hh", "k"), + Collections.emptyList(), + Collections.singletonMap(CoreOptions.WRITE_ONLY.key(), "true")); + CompactAction action = + createAction( + CompactAction.class, + "compact", + "--warehouse", + warehouse, + "--database", + database, + "--table", + tableName, + "--compact_strategy", + "full", + "--table_conf", + CoreOptions.NUM_SORTED_RUNS_COMPACTION_TRIGGER.key() + "=3"); + StreamExecutionEnvironment env = + streamExecutionEnvironmentBuilder().streamingMode().build(); + Assertions.assertThatThrownBy(() -> action.withStreamExecutionEnvironment(env).build()) + .hasMessage( + "The full compact strategy is only supported in batch mode. 
Please add -Dexecution.runtime-mode=BATCH."); + } + + @Test + @Timeout(60) + public void testCompactStrategyWithWrongUsage() throws Exception { + prepareTable( + Arrays.asList("dt", "hh"), + Arrays.asList("dt", "hh", "k"), + Collections.emptyList(), + Collections.singletonMap(CoreOptions.WRITE_ONLY.key(), "true")); + Assertions.assertThatThrownBy( + () -> + createAction( + CompactAction.class, + "compact", + "--warehouse", + warehouse, + "--database", + database, + "--table", + tableName, + "--compact_strategy", + "wrong_usage", + "--table_conf", + CoreOptions.NUM_SORTED_RUNS_COMPACTION_TRIGGER.key() + + "=3")) + .hasMessage( + "The compact strategy only supports 'full' or 'minor', but 'wrong_usage' is configured."); + } +} diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/procedure/CompactProcedureITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/procedure/CompactProcedureITCase.java index bec669acd30d3..d79d13f0260cd 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/procedure/CompactProcedureITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/procedure/CompactProcedureITCase.java @@ -31,6 +31,7 @@ import org.apache.flink.table.api.config.TableConfigOptions; import org.apache.flink.types.Row; import org.apache.flink.types.RowKind; +import org.assertj.core.api.Assertions; import org.junit.jupiter.api.Test; import java.util.List; @@ -240,6 +241,117 @@ public void testDynamicBucketSortCompact() throws Exception { checkLatestSnapshot(table, 21, Snapshot.CommitKind.OVERWRITE); } + // ----------------------- Minor Compact ----------------------- + + @Test + public void testBatchMinorCompactStrategy() throws Exception { + sql( + "CREATE TABLE T (" + + " k INT," + + " v INT," + + " hh INT," + + " dt STRING," + + " PRIMARY KEY (k, dt, hh) NOT ENFORCED" + + ") PARTITIONED BY (dt, hh) WITH (" + + " 'write-only' = 'true'," + + " 'bucket' = '1'" + + ")"); + FileStoreTable table = paimonTable("T"); + tEnv.getConfig().set(TableConfigOptions.TABLE_DML_SYNC, true); + + sql("INSERT INTO T VALUES (1, 100, 15, '20221208'), (1, 100, 16, '20221208')"); + sql("INSERT INTO T VALUES (2, 100, 15, '20221208'), (2, 100, 16, '20221208')"); + + checkLatestSnapshot(table, 2, Snapshot.CommitKind.APPEND); + + sql( + "CALL sys.compact(`table` => 'default.T', compact_strategy => 'minor', " + + "options => 'num-sorted-run.compaction-trigger=3')"); + + // Due to the limitation of parameter 'num-sorted-run.compaction-trigger' = 3, so compact is + // not + // performed. + checkLatestSnapshot(table, 2, Snapshot.CommitKind.APPEND); + + // Make par-15 has 3 datafile and par-16 has 2 datafile, so par-16 will not be picked out to + // compact. + sql("INSERT INTO T VALUES (1, 100, 15, '20221208')"); + + sql( + "CALL sys.compact(`table` => 'default.T', compact_strategy => 'minor', " + + "options => 'num-sorted-run.compaction-trigger=3')"); + + checkLatestSnapshot(table, 4, Snapshot.CommitKind.COMPACT); + + List splits = table.newSnapshotReader().read().dataSplits(); + assertThat(splits.size()).isEqualTo(2); + for (DataSplit split : splits) { + // Par-16 is not compacted. + assertThat(split.dataFiles().size()) + .isEqualTo(split.partition().getInt(1) == 16 ? 
2 : 1); + } + } + + @Test + public void testBatchFullCompactStrategy() throws Exception { + sql( + "CREATE TABLE T (" + + " k INT," + + " v INT," + + " hh INT," + + " dt STRING," + + " PRIMARY KEY (k, dt, hh) NOT ENFORCED" + + ") PARTITIONED BY (dt, hh) WITH (" + + " 'write-only' = 'true'," + + " 'bucket' = '1'" + + ")"); + FileStoreTable table = paimonTable("T"); + tEnv.getConfig().set(TableConfigOptions.TABLE_DML_SYNC, true); + + sql("INSERT INTO T VALUES (1, 100, 15, '20221208'), (1, 100, 16, '20221208')"); + sql("INSERT INTO T VALUES (2, 100, 15, '20221208'), (2, 100, 16, '20221208')"); + + checkLatestSnapshot(table, 2, Snapshot.CommitKind.APPEND); + + sql( + "CALL sys.compact(`table` => 'default.T', compact_strategy => 'full', " + + "options => 'num-sorted-run.compaction-trigger=3')"); + + checkLatestSnapshot(table, 3, Snapshot.CommitKind.COMPACT); + + List splits = table.newSnapshotReader().read().dataSplits(); + assertThat(splits.size()).isEqualTo(2); + for (DataSplit split : splits) { + // Par-16 is not compacted. + assertThat(split.dataFiles().size()).isEqualTo(1); + } + } + + @Test + public void testStreamFullCompactStrategy() throws Exception { + sql( + "CREATE TABLE T (" + + " k INT," + + " v INT," + + " hh INT," + + " dt STRING," + + " PRIMARY KEY (k, dt, hh) NOT ENFORCED" + + ") PARTITIONED BY (dt, hh) WITH (" + + " 'write-only' = 'true'," + + " 'bucket' = '1'" + + ")"); + tEnv.getConfig().set(TableConfigOptions.TABLE_DML_SYNC, true); + + Assertions.assertThatThrownBy( + () -> + streamSqlIter( + "CALL sys.compact(`table` => 'default.T', compact_strategy => 'full', " + + "options => 'num-sorted-run.compaction-trigger=3')") + .close()) + .hasMessageContaining( + "The full compact strategy is only supported in batch mode. Please add -Dexecution.runtime-mode=BATCH."); + } + private void checkLatestSnapshot( FileStoreTable table, long snapshotId, Snapshot.CommitKind commitKind) { SnapshotManager snapshotManager = table.snapshotManager(); diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CompactorSinkITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CompactorSinkITCase.java index c38ac4b3d685c..42293ca2842e1 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CompactorSinkITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CompactorSinkITCase.java @@ -132,7 +132,7 @@ public void testCompact() throws Exception { .withContinuousMode(false) .withPartitionPredicate(predicate) .build(); - new CompactorSinkBuilder(table).withFullCompaction(true).withInput(source).build(); + new CompactorSinkBuilder(table, true).withInput(source).build(); env.execute(); snapshot = snapshotManager.snapshot(snapshotManager.latestSnapshotId()); @@ -181,8 +181,8 @@ public void testCompactParallelism() throws Exception { FlinkConnectorOptions.SINK_PARALLELISM.key(), String.valueOf(sinkParalellism)); } - })) - .withFullCompaction(false) + }), + false) .withInput(source) .build(); @@ -275,7 +275,13 @@ protected StoreCompactOperator createCompactOperator(FileStoreTable table) { protected MultiTablesStoreCompactOperator createMultiTablesCompactOperator( Catalog.Loader catalogLoader) throws Exception { return new MultiTablesStoreCompactOperator( - catalogLoader, commitUser, new CheckpointConfig(), false, false, new Options()); + catalogLoader, + commitUser, + new CheckpointConfig(), + false, + false, + true, + new Options()); } private static byte[] 
partition(String dt, int hh) { diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/procedure/CompactProcedure.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/procedure/CompactProcedure.java index 71cf04cf5ef55..4a43e39c31ba1 100644 --- a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/procedure/CompactProcedure.java +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/procedure/CompactProcedure.java @@ -107,6 +107,7 @@ public class CompactProcedure extends BaseProcedure { new ProcedureParameter[] { ProcedureParameter.required("table", StringType), ProcedureParameter.optional("partitions", StringType), + ProcedureParameter.optional("compact_strategy", StringType), ProcedureParameter.optional("order_strategy", StringType), ProcedureParameter.optional("order_by", StringType), ProcedureParameter.optional("where", StringType), @@ -120,6 +121,9 @@ public class CompactProcedure extends BaseProcedure { new StructField("result", DataTypes.BooleanType, true, Metadata.empty()) }); + private static final String MINOR = "minor"; + private static final String FULL = "full"; + protected CompactProcedure(TableCatalog tableCatalog) { super(tableCatalog); } @@ -138,15 +142,17 @@ public StructType outputType() { public InternalRow[] call(InternalRow args) { Identifier tableIdent = toIdentifier(args.getString(0), PARAMETERS[0].name()); String partitions = blank(args, 1) ? null : args.getString(1); - String sortType = blank(args, 2) ? TableSorter.OrderType.NONE.name() : args.getString(2); + // make full compact strategy as default. + String compactStrategy = blank(args, 2) ? FULL : args.getString(2); + String sortType = blank(args, 3) ? TableSorter.OrderType.NONE.name() : args.getString(3); List sortColumns = - blank(args, 3) + blank(args, 4) ? Collections.emptyList() - : Arrays.asList(args.getString(3).split(",")); - String where = blank(args, 4) ? null : args.getString(4); - String options = args.isNullAt(5) ? null : args.getString(5); + : Arrays.asList(args.getString(4).split(",")); + String where = blank(args, 5) ? null : args.getString(5); + String options = args.isNullAt(6) ? null : args.getString(6); Duration partitionIdleTime = - blank(args, 6) ? null : TimeUtils.parseDuration(args.getString(6)); + blank(args, 7) ? 
null : TimeUtils.parseDuration(args.getString(7)); if (TableSorter.OrderType.NONE.name().equals(sortType) && !sortColumns.isEmpty()) { throw new IllegalArgumentException( "order_strategy \"none\" cannot work with order_by columns."); @@ -155,6 +161,14 @@ public InternalRow[] call(InternalRow args) { throw new IllegalArgumentException( "sort compact do not support 'partition_idle_time'."); } + + if (!(compactStrategy.equalsIgnoreCase(FULL) || compactStrategy.equalsIgnoreCase(MINOR))) { + throw new IllegalArgumentException( + String.format( + "The compact strategy only supports 'full' or 'minor', but '%s' is configured.", + compactStrategy)); + } + checkArgument( partitions == null || where == null, "partitions and where cannot be used together."); @@ -192,6 +206,7 @@ public InternalRow[] call(InternalRow args) { newInternalRow( execute( (FileStoreTable) table, + compactStrategy, sortType, sortColumns, relation, @@ -212,6 +227,7 @@ private boolean blank(InternalRow args, int index) { private boolean execute( FileStoreTable table, + String compactStrategy, String sortType, List sortColumns, DataSourceV2Relation relation, @@ -219,6 +235,7 @@ private boolean execute( @Nullable Duration partitionIdleTime) { BucketMode bucketMode = table.bucketMode(); TableSorter.OrderType orderType = TableSorter.OrderType.of(sortType); + boolean fullCompact = compactStrategy.equalsIgnoreCase(FULL); Predicate filter = condition == null ? null @@ -233,7 +250,8 @@ private boolean execute( switch (bucketMode) { case HASH_FIXED: case HASH_DYNAMIC: - compactAwareBucketTable(table, filter, partitionIdleTime, javaSparkContext); + compactAwareBucketTable( + table, fullCompact, filter, partitionIdleTime, javaSparkContext); break; case BUCKET_UNAWARE: compactUnAwareBucketTable(table, filter, partitionIdleTime, javaSparkContext); @@ -259,6 +277,7 @@ private boolean execute( private void compactAwareBucketTable( FileStoreTable table, + boolean fullCompact, @Nullable Predicate filter, @Nullable Duration partitionIdleTime, JavaSparkContext javaSparkContext) { @@ -304,7 +323,7 @@ private void compactAwareBucketTable( SerializationUtils.deserializeBinaryRow( pair.getLeft()), pair.getRight(), - true); + fullCompact); } CommitMessageSerializer serializer = new CommitMessageSerializer(); diff --git a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CompactProcedureTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CompactProcedureTestBase.scala index 130860c8351e8..31f78f61c20d9 100644 --- a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CompactProcedureTestBase.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/procedure/CompactProcedureTestBase.scala @@ -39,6 +39,56 @@ abstract class CompactProcedureTestBase extends PaimonSparkTestBase with StreamT import testImplicits._ + // ----------------------- Minor Compact ----------------------- + + test("Paimon Procedure: compact aware bucket pk table with minor compact strategy") { + withTable("T") { + spark.sql(s""" + |CREATE TABLE T (id INT, value STRING, pt STRING) + |TBLPROPERTIES ('primary-key'='id, pt', 'bucket'='1', 'write-only'='true') + |PARTITIONED BY (pt) + |""".stripMargin) + + val table = loadTable("T") + + spark.sql(s"INSERT INTO T VALUES (1, 'a', 'p1'), (2, 'b', 'p2')") + spark.sql(s"INSERT INTO T VALUES (3, 'c', 'p1'), (4, 'd', 'p2')") + + Assertions.assertThat(lastSnapshotCommand(table).equals(CommitKind.APPEND)).isTrue + 
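Both the Flink action and the Spark procedure now take a compact_strategy argument that defaults to 'full'; anything other than 'full' or 'minor' is rejected, and the value is reduced to a single boolean before compaction runs. A hedged standalone sketch of that mapping (class and helper names here are made up; the error message mirrors the hunk above):

    // Hypothetical mirror of the strategy handling added in CompactProcedure; the real
    // procedure derives the same boolean and passes it down to compactAwareBucketTable.
    class CompactStrategyExample {
        static boolean toFullCompact(String compactStrategy) {
            boolean full = "full".equalsIgnoreCase(compactStrategy);
            if (!full && !"minor".equalsIgnoreCase(compactStrategy)) {
                throw new IllegalArgumentException(
                        String.format(
                                "The compact strategy only supports 'full' or 'minor', but '%s' is configured.",
                                compactStrategy));
            }
            return full;
        }

        public static void main(String[] args) {
            // false: only buckets that reach 'num-sorted-run.compaction-trigger' are compacted.
            System.out.println(toFullCompact("minor"));
            // true: every bucket is fully compacted regardless of the trigger.
            System.out.println(toFullCompact("FULL"));
        }
    }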
Assertions.assertThat(lastSnapshotId(table)).isEqualTo(2) + + spark.sql( + "CALL sys.compact(table => 'T', compact_strategy => 'minor'," + + "options => 'num-sorted-run.compaction-trigger=3')") + + // Due to the limitation of parameter 'num-sorted-run.compaction-trigger' = 3, so compact is not + // performed. + Assertions.assertThat(lastSnapshotCommand(table).equals(CommitKind.APPEND)).isTrue + Assertions.assertThat(lastSnapshotId(table)).isEqualTo(2) + + // Make par-p1 has 3 datafile and par-p2 has 2 datafile, so par-p2 will not be picked out to + // compact. + spark.sql(s"INSERT INTO T VALUES (1, 'a', 'p1')") + + spark.sql( + "CALL sys.compact(table => 'T', compact_strategy => 'minor'," + + "options => 'num-sorted-run.compaction-trigger=3')") + + Assertions.assertThat(lastSnapshotId(table)).isEqualTo(4) + Assertions.assertThat(lastSnapshotCommand(table).equals(CommitKind.COMPACT)).isTrue + + val splits = table.newSnapshotReader.read.dataSplits + splits.forEach( + split => { + Assertions + .assertThat(split.dataFiles.size) + .isEqualTo(if (split.partition().getString(0).toString == "p2") 2 else 1) + }) + } + } + + // ----------------------- Sort Compact ----------------------- + test("Paimon Procedure: sort compact") { failAfter(streamingTimeout) { withTempDir { From cdd4061db4b43393aab6fc5b2ce2c13ed34c69f3 Mon Sep 17 00:00:00 2001 From: xleoken Date: Thu, 28 Nov 2024 14:31:01 +0800 Subject: [PATCH 076/157] [core] Improve the performance of show tables with hive metastore (#4605) --- .../src/main/java/org/apache/paimon/hive/HiveCatalog.java | 6 ++---- 1 file changed, 2 insertions(+), 4 deletions(-) diff --git a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java index 0ecc78469e154..9a90995f282d2 100644 --- a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java +++ b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java @@ -1017,10 +1017,8 @@ public Table getHmsTable(Identifier identifier) throws TableNotExistException { private boolean isPaimonTable(Identifier identifier, Table table) { return isPaimonTable(table) - && tableSchemaInFileSystem( - getTableLocation(identifier, table), - identifier.getBranchNameOrDefault()) - .isPresent(); + && tableExistsInFileSystem( + getTableLocation(identifier, table), identifier.getBranchNameOrDefault()); } private static boolean isPaimonTable(Table table) { From 0fe18e89f04f2c32a7d41560dfa2ac03134904b1 Mon Sep 17 00:00:00 2001 From: lining Date: Thu, 28 Nov 2024 19:58:31 +0800 Subject: [PATCH 077/157] [core] Add basic implementation to support REST Catalog (#4553) --- .../apache/paimon/utils/ThreadPoolUtils.java | 12 +- paimon-core/pom.xml | 57 +++++ .../paimon/rest/DefaultErrorHandler.java | 61 ++++++ .../org/apache/paimon/rest/ErrorHandler.java | 26 +++ .../org/apache/paimon/rest/HttpClient.java | 142 +++++++++++++ .../apache/paimon/rest/HttpClientOptions.java | 74 +++++++ .../org/apache/paimon/rest/RESTCatalog.java | 197 ++++++++++++++++++ .../paimon/rest/RESTCatalogFactory.java | 38 ++++ .../rest/RESTCatalogInternalOptions.java | 31 +++ .../paimon/rest/RESTCatalogOptions.java | 53 +++++ .../org/apache/paimon/rest/RESTClient.java | 31 +++ .../org/apache/paimon/rest/RESTMessage.java | 22 ++ .../apache/paimon/rest/RESTObjectMapper.java | 35 ++++ .../org/apache/paimon/rest/RESTRequest.java | 22 ++ .../org/apache/paimon/rest/RESTResponse.java | 22 ++ 
.../java/org/apache/paimon/rest/RESTUtil.java | 55 +++++ .../org/apache/paimon/rest/ResourcePaths.java | 34 +++ .../rest/exceptions/BadRequestException.java | 27 +++ .../rest/exceptions/ForbiddenException.java | 26 +++ .../exceptions/NotAuthorizedException.java | 26 +++ .../paimon/rest/exceptions/RESTException.java | 30 +++ .../exceptions/ServiceFailureException.java | 26 +++ .../ServiceUnavailableException.java | 26 +++ .../paimon/rest/responses/ConfigResponse.java | 76 +++++++ .../paimon/rest/responses/ErrorResponse.java | 91 ++++++++ .../src/main/resources/META-INF/NOTICE | 8 + .../org.apache.paimon.factories.Factory | 1 + .../paimon/rest/DefaultErrorHandlerTest.java | 77 +++++++ .../apache/paimon/rest/HttpClientTest.java | 129 ++++++++++++ .../org/apache/paimon/rest/MockRESTData.java | 44 ++++ .../apache/paimon/rest/RESTCatalogTest.java | 86 ++++++++ .../paimon/rest/RESTObjectMapperTest.java | 59 ++++++ paimon-open-api/Makefile | 25 +++ paimon-open-api/README.md | 10 + paimon-open-api/generate.sh | 48 +++++ paimon-open-api/pom.xml | 85 ++++++++ paimon-open-api/rest-catalog-open-api.yaml | 60 ++++++ .../paimon/open/api/OpenApiApplication.java | 31 +++ .../open/api/RESTCatalogController.java | 69 ++++++ .../paimon/open/api/config/OpenAPIConfig.java | 60 ++++++ .../src/main/resources/application.properties | 22 ++ pom.xml | 1 + 42 files changed, 2054 insertions(+), 1 deletion(-) create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/DefaultErrorHandler.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/ErrorHandler.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/HttpClient.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/HttpClientOptions.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalog.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogFactory.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogInternalOptions.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogOptions.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/RESTClient.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/RESTMessage.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/RESTObjectMapper.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/RESTRequest.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/RESTResponse.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/RESTUtil.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/ResourcePaths.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/exceptions/BadRequestException.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ForbiddenException.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/exceptions/NotAuthorizedException.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/exceptions/RESTException.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ServiceFailureException.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ServiceUnavailableException.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/responses/ConfigResponse.java create mode 100644 paimon-core/src/main/java/org/apache/paimon/rest/responses/ErrorResponse.java 
create mode 100644 paimon-core/src/main/resources/META-INF/NOTICE create mode 100644 paimon-core/src/test/java/org/apache/paimon/rest/DefaultErrorHandlerTest.java create mode 100644 paimon-core/src/test/java/org/apache/paimon/rest/HttpClientTest.java create mode 100644 paimon-core/src/test/java/org/apache/paimon/rest/MockRESTData.java create mode 100644 paimon-core/src/test/java/org/apache/paimon/rest/RESTCatalogTest.java create mode 100644 paimon-core/src/test/java/org/apache/paimon/rest/RESTObjectMapperTest.java create mode 100644 paimon-open-api/Makefile create mode 100644 paimon-open-api/README.md create mode 100755 paimon-open-api/generate.sh create mode 100644 paimon-open-api/pom.xml create mode 100644 paimon-open-api/rest-catalog-open-api.yaml create mode 100644 paimon-open-api/src/main/java/org/apache/paimon/open/api/OpenApiApplication.java create mode 100644 paimon-open-api/src/main/java/org/apache/paimon/open/api/RESTCatalogController.java create mode 100644 paimon-open-api/src/main/java/org/apache/paimon/open/api/config/OpenAPIConfig.java create mode 100644 paimon-open-api/src/main/resources/application.properties diff --git a/paimon-common/src/main/java/org/apache/paimon/utils/ThreadPoolUtils.java b/paimon-common/src/main/java/org/apache/paimon/utils/ThreadPoolUtils.java index 112b9ad1cda28..f8959def67d13 100644 --- a/paimon-common/src/main/java/org/apache/paimon/utils/ThreadPoolUtils.java +++ b/paimon-common/src/main/java/org/apache/paimon/utils/ThreadPoolUtils.java @@ -30,6 +30,7 @@ import java.util.List; import java.util.NoSuchElementException; import java.util.Queue; +import java.util.concurrent.BlockingQueue; import java.util.concurrent.ExecutionException; import java.util.concurrent.ExecutorService; import java.util.concurrent.Executors; @@ -54,13 +55,22 @@ public class ThreadPoolUtils { * is max thread number. */ public static ThreadPoolExecutor createCachedThreadPool(int threadNum, String namePrefix) { + return createCachedThreadPool(threadNum, namePrefix, new LinkedBlockingQueue<>()); + } + + /** + * Create a thread pool with max thread number and define queue. Inactive threads will + * automatically exit. + */ + public static ThreadPoolExecutor createCachedThreadPool( + int threadNum, String namePrefix, BlockingQueue workQueue) { ThreadPoolExecutor executor = new ThreadPoolExecutor( threadNum, threadNum, 1, TimeUnit.MINUTES, - new LinkedBlockingQueue<>(), + workQueue, newDaemonThreadFactory(namePrefix)); executor.allowCoreThreadTimeOut(true); return executor; diff --git a/paimon-core/pom.xml b/paimon-core/pom.xml index 399f0b5d6c19a..e137d57a6db15 100644 --- a/paimon-core/pom.xml +++ b/paimon-core/pom.xml @@ -33,6 +33,7 @@ under the License. 6.20.3-ververica-2.0 + 4.12.0 @@ -63,6 +64,14 @@ under the License. provided + + + + com.squareup.okhttp3 + okhttp + ${okhttp.version} + + @@ -204,6 +213,20 @@ under the License. test + + com.squareup.okhttp3 + mockwebserver + ${okhttp.version} + test + + + org.mockito + mockito-core + ${mockito.version} + jar + test + + @@ -219,6 +242,40 @@ under the License. 
+ + org.apache.maven.plugins + maven-shade-plugin + + + shade-paimon + package + + shade + + + + + * + + okhttp3/internal/publicsuffix/NOTICE + + + + + + com.squareup.okhttp3:okhttp + + + + + okhttp3 + org.apache.paimon.shade.okhttp3 + + + + + + diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/DefaultErrorHandler.java b/paimon-core/src/main/java/org/apache/paimon/rest/DefaultErrorHandler.java new file mode 100644 index 0000000000000..1a8618c1c603f --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/DefaultErrorHandler.java @@ -0,0 +1,61 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.rest.exceptions.BadRequestException; +import org.apache.paimon.rest.exceptions.ForbiddenException; +import org.apache.paimon.rest.exceptions.NotAuthorizedException; +import org.apache.paimon.rest.exceptions.RESTException; +import org.apache.paimon.rest.exceptions.ServiceFailureException; +import org.apache.paimon.rest.exceptions.ServiceUnavailableException; +import org.apache.paimon.rest.responses.ErrorResponse; + +/** Default error handler. */ +public class DefaultErrorHandler extends ErrorHandler { + private static final ErrorHandler INSTANCE = new DefaultErrorHandler(); + + public static ErrorHandler getInstance() { + return INSTANCE; + } + + @Override + public void accept(ErrorResponse error) { + int code = error.code(); + switch (code) { + case 400: + throw new BadRequestException( + String.format("Malformed request: %s", error.message())); + case 401: + throw new NotAuthorizedException("Not authorized: %s", error.message()); + case 403: + throw new ForbiddenException("Forbidden: %s", error.message()); + case 405: + case 406: + break; + case 500: + throw new ServiceFailureException("Server error: %s", error.message()); + case 501: + throw new UnsupportedOperationException(error.message()); + case 503: + throw new ServiceUnavailableException("Service unavailable: %s", error.message()); + } + + throw new RESTException("Unable to process: %s", error.message()); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/ErrorHandler.java b/paimon-core/src/main/java/org/apache/paimon/rest/ErrorHandler.java new file mode 100644 index 0000000000000..cdfa4bcdfaac6 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/ErrorHandler.java @@ -0,0 +1,26 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. 
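DefaultErrorHandler turns server-side error payloads into typed client exceptions; status codes it does not recognize fall through to the generic RESTException. A small hedged usage sketch, assuming only the classes introduced in this patch (the message text is illustrative):

    import org.apache.paimon.rest.DefaultErrorHandler;
    import org.apache.paimon.rest.exceptions.NotAuthorizedException;
    import org.apache.paimon.rest.responses.ErrorResponse;

    class ErrorHandlingExample {
        public static void main(String[] args) {
            try {
                // 401 is mapped to NotAuthorizedException by the switch above.
                DefaultErrorHandler.getInstance().accept(new ErrorResponse("expired token", 401));
            } catch (NotAuthorizedException e) {
                System.out.println(e.getMessage()); // "Not authorized: expired token"
            }
            // Unmapped codes (for example 404) surface as a generic RESTException instead.
        }
    }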
You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.rest.responses.ErrorResponse; + +import java.util.function.Consumer; + +/** Error handler for REST client. */ +public abstract class ErrorHandler implements Consumer {} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/HttpClient.java b/paimon-core/src/main/java/org/apache/paimon/rest/HttpClient.java new file mode 100644 index 0000000000000..e092711e5f971 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/HttpClient.java @@ -0,0 +1,142 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.rest.exceptions.RESTException; +import org.apache.paimon.rest.responses.ErrorResponse; + +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.core.JsonProcessingException; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.databind.ObjectMapper; + +import okhttp3.Dispatcher; +import okhttp3.Headers; +import okhttp3.MediaType; +import okhttp3.OkHttpClient; +import okhttp3.Request; +import okhttp3.RequestBody; +import okhttp3.Response; + +import java.io.IOException; +import java.util.Arrays; +import java.util.Map; +import java.util.concurrent.BlockingQueue; +import java.util.concurrent.ExecutorService; +import java.util.concurrent.SynchronousQueue; + +import static okhttp3.ConnectionSpec.CLEARTEXT; +import static okhttp3.ConnectionSpec.COMPATIBLE_TLS; +import static okhttp3.ConnectionSpec.MODERN_TLS; +import static org.apache.paimon.utils.ThreadPoolUtils.createCachedThreadPool; + +/** HTTP client for REST catalog. 
*/ +public class HttpClient implements RESTClient { + + private final OkHttpClient okHttpClient; + private final String uri; + private final ObjectMapper mapper; + private final ErrorHandler errorHandler; + + private static final String THREAD_NAME = "REST-CATALOG-HTTP-CLIENT-THREAD-POOL"; + private static final MediaType MEDIA_TYPE = MediaType.parse("application/json"); + + public HttpClient(HttpClientOptions httpClientOptions) { + this.uri = httpClientOptions.uri(); + this.mapper = httpClientOptions.mapper(); + this.okHttpClient = createHttpClient(httpClientOptions); + this.errorHandler = httpClientOptions.errorHandler(); + } + + @Override + public T get( + String path, Class responseType, Map headers) { + try { + Request request = + new Request.Builder() + .url(uri + path) + .get() + .headers(Headers.of(headers)) + .build(); + return exec(request, responseType); + } catch (Exception e) { + throw new RuntimeException(e); + } + } + + @Override + public T post( + String path, RESTRequest body, Class responseType, Map headers) { + try { + RequestBody requestBody = buildRequestBody(body); + Request request = + new Request.Builder() + .url(uri + path) + .post(requestBody) + .headers(Headers.of(headers)) + .build(); + return exec(request, responseType); + } catch (Exception e) { + throw new RuntimeException(e); + } + } + + @Override + public void close() throws IOException { + okHttpClient.dispatcher().cancelAll(); + okHttpClient.connectionPool().evictAll(); + } + + private T exec(Request request, Class responseType) { + try (Response response = okHttpClient.newCall(request).execute()) { + String responseBodyStr = response.body() != null ? response.body().string() : null; + if (!response.isSuccessful()) { + ErrorResponse error = + new ErrorResponse( + responseBodyStr != null ? responseBodyStr : "response body is null", + response.code()); + errorHandler.accept(error); + } + if (responseBodyStr == null) { + throw new RESTException("response body is null."); + } + return mapper.readValue(responseBodyStr, responseType); + } catch (Exception e) { + throw new RESTException(e, "rest exception"); + } + } + + private RequestBody buildRequestBody(RESTRequest body) throws JsonProcessingException { + return RequestBody.create(mapper.writeValueAsBytes(body), MEDIA_TYPE); + } + + private static OkHttpClient createHttpClient(HttpClientOptions httpClientOptions) { + BlockingQueue workQueue = new SynchronousQueue<>(); + ExecutorService executorService = + createCachedThreadPool(httpClientOptions.threadPoolSize(), THREAD_NAME, workQueue); + + OkHttpClient.Builder builder = + new OkHttpClient.Builder() + .dispatcher(new Dispatcher(executorService)) + .retryOnConnectionFailure(true) + .connectionSpecs(Arrays.asList(MODERN_TLS, COMPATIBLE_TLS, CLEARTEXT)); + httpClientOptions.connectTimeout().ifPresent(builder::connectTimeout); + httpClientOptions.readTimeout().ifPresent(builder::readTimeout); + + return builder.build(); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/HttpClientOptions.java b/paimon-core/src/main/java/org/apache/paimon/rest/HttpClientOptions.java new file mode 100644 index 0000000000000..694779cfdb86f --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/HttpClientOptions.java @@ -0,0 +1,74 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. 
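HttpClient wires OkHttp to the shared Jackson mapper and the error handler; a request is a path relative to the configured uri plus a header map. A minimal, hedged example of fetching the config endpoint added in this patch (the server address is a placeholder, and a reachable server is assumed):

    import org.apache.paimon.rest.DefaultErrorHandler;
    import org.apache.paimon.rest.HttpClient;
    import org.apache.paimon.rest.HttpClientOptions;
    import org.apache.paimon.rest.RESTObjectMapper;
    import org.apache.paimon.rest.ResourcePaths;
    import org.apache.paimon.rest.responses.ConfigResponse;

    import java.time.Duration;
    import java.util.Collections;
    import java.util.Optional;

    class HttpClientExample {
        public static void main(String[] args) throws Exception {
            HttpClientOptions options =
                    new HttpClientOptions(
                            "http://localhost:8080",            // placeholder server address
                            Optional.of(Duration.ofSeconds(3)), // connect timeout
                            Optional.of(Duration.ofSeconds(3)), // read timeout
                            RESTObjectMapper.create(),
                            1,                                  // thread pool size
                            DefaultErrorHandler.getInstance());
            try (HttpClient client = new HttpClient(options)) {
                // GET <uri>/api/v1/config, deserialized through the shared ObjectMapper.
                ConfigResponse config =
                        client.get(ResourcePaths.V1_CONFIG, ConfigResponse.class, Collections.emptyMap());
                System.out.println(config.defaults());
            }
        }
    }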
The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.databind.ObjectMapper; + +import java.time.Duration; +import java.util.Optional; + +/** Options for Http Client. */ +public class HttpClientOptions { + + private final String uri; + private final Optional connectTimeout; + private final Optional readTimeout; + private final ObjectMapper mapper; + private final int threadPoolSize; + private final ErrorHandler errorHandler; + + public HttpClientOptions( + String uri, + Optional connectTimeout, + Optional readTimeout, + ObjectMapper mapper, + int threadPoolSize, + ErrorHandler errorHandler) { + this.uri = uri; + this.connectTimeout = connectTimeout; + this.readTimeout = readTimeout; + this.mapper = mapper; + this.threadPoolSize = threadPoolSize; + this.errorHandler = errorHandler; + } + + public String uri() { + return uri; + } + + public Optional connectTimeout() { + return connectTimeout; + } + + public Optional readTimeout() { + return readTimeout; + } + + public ObjectMapper mapper() { + return mapper; + } + + public int threadPoolSize() { + return threadPoolSize; + } + + public ErrorHandler errorHandler() { + return errorHandler; + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalog.java b/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalog.java new file mode 100644 index 0000000000000..c96400831370c --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalog.java @@ -0,0 +1,197 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.rest; + +import org.apache.paimon.annotation.VisibleForTesting; +import org.apache.paimon.catalog.Catalog; +import org.apache.paimon.catalog.Database; +import org.apache.paimon.catalog.Identifier; +import org.apache.paimon.fs.FileIO; +import org.apache.paimon.fs.Path; +import org.apache.paimon.manifest.PartitionEntry; +import org.apache.paimon.options.CatalogOptions; +import org.apache.paimon.options.Options; +import org.apache.paimon.rest.responses.ConfigResponse; +import org.apache.paimon.schema.Schema; +import org.apache.paimon.schema.SchemaChange; +import org.apache.paimon.table.Table; + +import org.apache.paimon.shade.guava30.com.google.common.collect.ImmutableMap; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.databind.ObjectMapper; + +import java.time.Duration; +import java.util.List; +import java.util.Map; +import java.util.Optional; + +/** A catalog implementation for REST. */ +public class RESTCatalog implements Catalog { + private RESTClient client; + private String token; + private ResourcePaths resourcePaths; + private Map options; + private Map baseHeader; + + private static final ObjectMapper objectMapper = RESTObjectMapper.create(); + static final String AUTH_HEADER = "Authorization"; + static final String AUTH_HEADER_VALUE_FORMAT = "Bearer %s"; + + public RESTCatalog(Options options) { + if (options.getOptional(CatalogOptions.WAREHOUSE).isPresent()) { + throw new IllegalArgumentException("Can not config warehouse in RESTCatalog."); + } + String uri = options.get(RESTCatalogOptions.URI); + token = options.get(RESTCatalogOptions.TOKEN); + Optional connectTimeout = + options.getOptional(RESTCatalogOptions.CONNECTION_TIMEOUT); + Optional readTimeout = options.getOptional(RESTCatalogOptions.READ_TIMEOUT); + Integer threadPoolSize = options.get(RESTCatalogOptions.THREAD_POOL_SIZE); + HttpClientOptions httpClientOptions = + new HttpClientOptions( + uri, + connectTimeout, + readTimeout, + objectMapper, + threadPoolSize, + DefaultErrorHandler.getInstance()); + this.client = new HttpClient(httpClientOptions); + Map authHeaders = + ImmutableMap.of(AUTH_HEADER, String.format(AUTH_HEADER_VALUE_FORMAT, token)); + Map initHeaders = + RESTUtil.merge(configHeaders(options.toMap()), authHeaders); + this.options = fetchOptionsFromServer(initHeaders, options.toMap()); + this.baseHeader = configHeaders(this.options()); + this.resourcePaths = + ResourcePaths.forCatalogProperties( + this.options.get(RESTCatalogInternalOptions.PREFIX)); + } + + @Override + public String warehouse() { + throw new UnsupportedOperationException(); + } + + @Override + public Map options() { + return this.options; + } + + @Override + public FileIO fileIO() { + throw new UnsupportedOperationException(); + } + + @Override + public List listDatabases() { + throw new UnsupportedOperationException(); + } + + @Override + public void createDatabase(String name, boolean ignoreIfExists, Map properties) + throws DatabaseAlreadyExistException { + throw new UnsupportedOperationException(); + } + + @Override + public Database getDatabase(String name) throws DatabaseNotExistException { + throw new UnsupportedOperationException(); + } + + @Override + public void dropDatabase(String name, boolean ignoreIfNotExists, boolean cascade) + throws DatabaseNotExistException, DatabaseNotEmptyException { + throw new UnsupportedOperationException(); + } + + @Override + public Table getTable(Identifier identifier) throws TableNotExistException { + throw new UnsupportedOperationException(); + } + 
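The constructor above resolves the client-side options, attaches the token as an "Authorization: Bearer ..." header, and asks the server's config endpoint for defaults and overrides before any other call is made. A hedged sketch of constructing the catalog directly (uri and token values are placeholders; a real deployment would usually go through the 'rest' catalog factory shown later):

    import org.apache.paimon.options.Options;
    import org.apache.paimon.rest.RESTCatalog;
    import org.apache.paimon.rest.RESTCatalogOptions;

    class RESTCatalogExample {
        public static void main(String[] args) throws Exception {
            Options options = new Options();
            options.set(RESTCatalogOptions.URI, "http://localhost:8080"); // placeholder
            options.set(RESTCatalogOptions.TOKEN, "my-token");            // placeholder
            options.set(RESTCatalogOptions.THREAD_POOL_SIZE, 2);
            // Note: 'warehouse' must not be set; the constructor rejects it.
            // Construction immediately calls GET /api/v1/config and merges the
            // returned defaults/overrides into these options.
            try (RESTCatalog catalog = new RESTCatalog(options)) {
                System.out.println(catalog.options());
            }
        }
    }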
+ @Override + public Path getTableLocation(Identifier identifier) { + throw new UnsupportedOperationException(); + } + + @Override + public List listTables(String databaseName) throws DatabaseNotExistException { + throw new UnsupportedOperationException(); + } + + @Override + public void dropTable(Identifier identifier, boolean ignoreIfNotExists) + throws TableNotExistException { + throw new UnsupportedOperationException(); + } + + @Override + public void createTable(Identifier identifier, Schema schema, boolean ignoreIfExists) + throws TableAlreadyExistException, DatabaseNotExistException { + throw new UnsupportedOperationException(); + } + + @Override + public void renameTable(Identifier fromTable, Identifier toTable, boolean ignoreIfNotExists) + throws TableNotExistException, TableAlreadyExistException { + throw new UnsupportedOperationException(); + } + + @Override + public void alterTable( + Identifier identifier, List changes, boolean ignoreIfNotExists) + throws TableNotExistException, ColumnAlreadyExistException, ColumnNotExistException { + throw new UnsupportedOperationException(); + } + + @Override + public void createPartition(Identifier identifier, Map partitionSpec) + throws TableNotExistException { + throw new UnsupportedOperationException(); + } + + @Override + public void dropPartition(Identifier identifier, Map partitions) + throws TableNotExistException, PartitionNotExistException {} + + @Override + public List listPartitions(Identifier identifier) + throws TableNotExistException { + throw new UnsupportedOperationException(); + } + + @Override + public boolean allowUpperCase() { + return false; + } + + @Override + public void close() throws Exception {} + + @VisibleForTesting + Map fetchOptionsFromServer( + Map headers, Map clientProperties) { + ConfigResponse response = + client.get(ResourcePaths.V1_CONFIG, ConfigResponse.class, headers); + return response.merge(clientProperties); + } + + private static Map configHeaders(Map properties) { + return RESTUtil.extractPrefixMap(properties, "header."); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogFactory.java b/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogFactory.java new file mode 100644 index 0000000000000..a5c773cb4bd5e --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogFactory.java @@ -0,0 +1,38 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.catalog.Catalog; +import org.apache.paimon.catalog.CatalogContext; +import org.apache.paimon.catalog.CatalogFactory; + +/** Factory to create {@link RESTCatalog}. 
*/ +public class RESTCatalogFactory implements CatalogFactory { + public static final String IDENTIFIER = "rest"; + + @Override + public String identifier() { + return IDENTIFIER; + } + + @Override + public Catalog create(CatalogContext context) { + return new RESTCatalog(context.options()); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogInternalOptions.java b/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogInternalOptions.java new file mode 100644 index 0000000000000..cf61caa20e887 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogInternalOptions.java @@ -0,0 +1,31 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.options.ConfigOption; +import org.apache.paimon.options.ConfigOptions; + +/** Internal options for REST Catalog. */ +public class RESTCatalogInternalOptions { + public static final ConfigOption PREFIX = + ConfigOptions.key("prefix") + .stringType() + .noDefaultValue() + .withDescription("REST Catalog uri's prefix."); +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogOptions.java b/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogOptions.java new file mode 100644 index 0000000000000..6155b893751b1 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/RESTCatalogOptions.java @@ -0,0 +1,53 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.options.ConfigOption; +import org.apache.paimon.options.ConfigOptions; + +import java.time.Duration; + +/** Options for REST Catalog. 
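Because the factory registers the identifier "rest" through the Factory service file, the catalog can also be created generically instead of being instantiated by hand. A hedged sketch, assuming the standard CatalogFactory.createCatalog(CatalogContext) entry point and the 'metastore' option used to pick a catalog implementation; server address and token are placeholders:

    import org.apache.paimon.catalog.Catalog;
    import org.apache.paimon.catalog.CatalogContext;
    import org.apache.paimon.catalog.CatalogFactory;
    import org.apache.paimon.options.CatalogOptions;
    import org.apache.paimon.options.Options;
    import org.apache.paimon.rest.RESTCatalogOptions;

    class RESTCatalogFactoryExample {
        public static void main(String[] args) throws Exception {
            Options options = new Options();
            options.set(CatalogOptions.METASTORE, "rest");                // selects RESTCatalogFactory
            options.set(RESTCatalogOptions.URI, "http://localhost:8080"); // placeholder
            options.set(RESTCatalogOptions.TOKEN, "my-token");            // placeholder
            try (Catalog catalog = CatalogFactory.createCatalog(CatalogContext.create(options))) {
                System.out.println(catalog.options());
            }
        }
    }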
*/ +public class RESTCatalogOptions { + public static final ConfigOption URI = + ConfigOptions.key("uri") + .stringType() + .noDefaultValue() + .withDescription("REST Catalog server's uri."); + public static final ConfigOption TOKEN = + ConfigOptions.key("token") + .stringType() + .noDefaultValue() + .withDescription("REST Catalog server's auth token."); + public static final ConfigOption CONNECTION_TIMEOUT = + ConfigOptions.key("rest.client.connection-timeout") + .durationType() + .noDefaultValue() + .withDescription("REST Catalog http client connect timeout."); + public static final ConfigOption READ_TIMEOUT = + ConfigOptions.key("rest.client.read-timeout") + .durationType() + .noDefaultValue() + .withDescription("REST Catalog http client read timeout."); + public static final ConfigOption THREAD_POOL_SIZE = + ConfigOptions.key("rest.client.num-threads") + .intType() + .defaultValue(1) + .withDescription("REST Catalog http client thread num."); +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/RESTClient.java b/paimon-core/src/main/java/org/apache/paimon/rest/RESTClient.java new file mode 100644 index 0000000000000..feeed06a417ac --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/RESTClient.java @@ -0,0 +1,31 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import java.io.Closeable; +import java.util.Map; + +/** Interface for a basic HTTP Client for interfacing with the REST catalog. */ +public interface RESTClient extends Closeable { + + T get(String path, Class responseType, Map headers); + + T post( + String path, RESTRequest body, Class responseType, Map headers); +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/RESTMessage.java b/paimon-core/src/main/java/org/apache/paimon/rest/RESTMessage.java new file mode 100644 index 0000000000000..6cb0b6fa6573b --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/RESTMessage.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+ * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +/** Interface to mark both REST requests and responses. */ +public interface RESTMessage {} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/RESTObjectMapper.java b/paimon-core/src/main/java/org/apache/paimon/rest/RESTObjectMapper.java new file mode 100644 index 0000000000000..b1c83e90224ad --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/RESTObjectMapper.java @@ -0,0 +1,35 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.databind.DeserializationFeature; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.databind.ObjectMapper; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.databind.SerializationFeature; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.datatype.jsr310.JavaTimeModule; + +/** Object mapper for REST request and response. */ +public class RESTObjectMapper { + public static ObjectMapper create() { + ObjectMapper mapper = new ObjectMapper(); + mapper.configure(DeserializationFeature.FAIL_ON_UNKNOWN_PROPERTIES, false); + mapper.configure(SerializationFeature.FAIL_ON_EMPTY_BEANS, false); + mapper.registerModule(new JavaTimeModule()); + return mapper; + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/RESTRequest.java b/paimon-core/src/main/java/org/apache/paimon/rest/RESTRequest.java new file mode 100644 index 0000000000000..9c6758df14f04 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/RESTRequest.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +/** Interface to mark a REST request. 
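RESTObjectMapper is configured to ignore unknown JSON properties and tolerate empty beans, so a newer server can add response fields without breaking older clients. A small hedged round-trip using the ConfigResponse type from this patch (the extra "unknown" field is simply dropped):

    import org.apache.paimon.rest.RESTObjectMapper;
    import org.apache.paimon.rest.responses.ConfigResponse;

    import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.databind.ObjectMapper;

    class ObjectMapperExample {
        public static void main(String[] args) throws Exception {
            ObjectMapper mapper = RESTObjectMapper.create();
            String json = "{\"defaults\":{\"prefix\":\"paimon\"},\"overrides\":{},\"unknown\":1}";
            // FAIL_ON_UNKNOWN_PROPERTIES is disabled, so the "unknown" field is ignored.
            ConfigResponse response = mapper.readValue(json, ConfigResponse.class);
            System.out.println(response.defaults()); // {prefix=paimon}
        }
    }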
*/ +public interface RESTRequest extends RESTMessage {} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/RESTResponse.java b/paimon-core/src/main/java/org/apache/paimon/rest/RESTResponse.java new file mode 100644 index 0000000000000..a4149d3fda145 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/RESTResponse.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +/** Interface to mark a REST response. */ +public interface RESTResponse extends RESTMessage {} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/RESTUtil.java b/paimon-core/src/main/java/org/apache/paimon/rest/RESTUtil.java new file mode 100644 index 0000000000000..3d42e99fa6d59 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/RESTUtil.java @@ -0,0 +1,55 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.utils.Preconditions; + +import org.apache.paimon.shade.guava30.com.google.common.collect.ImmutableMap; +import org.apache.paimon.shade.guava30.com.google.common.collect.Maps; + +import java.util.Map; + +/** Util for REST. 
*/ +public class RESTUtil { + public static Map extractPrefixMap( + Map properties, String prefix) { + Preconditions.checkNotNull(properties, "Invalid properties map: null"); + Map result = Maps.newHashMap(); + for (Map.Entry entry : properties.entrySet()) { + if (entry.getKey() != null && entry.getKey().startsWith(prefix)) { + result.put( + entry.getKey().substring(prefix.length()), properties.get(entry.getKey())); + } + } + return result; + } + + public static Map merge( + Map target, Map updates) { + ImmutableMap.Builder builder = ImmutableMap.builder(); + for (Map.Entry entry : target.entrySet()) { + if (!updates.containsKey(entry.getKey())) { + builder.put(entry.getKey(), entry.getValue()); + } + } + updates.forEach(builder::put); + + return builder.build(); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/ResourcePaths.java b/paimon-core/src/main/java/org/apache/paimon/rest/ResourcePaths.java new file mode 100644 index 0000000000000..1fad87588a33e --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/ResourcePaths.java @@ -0,0 +1,34 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +/** Resource paths for REST catalog. */ +public class ResourcePaths { + public static final String V1_CONFIG = "/api/v1/config"; + + public static ResourcePaths forCatalogProperties(String prefix) { + return new ResourcePaths(prefix); + } + + private final String prefix; + + public ResourcePaths(String prefix) { + this.prefix = prefix; + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/BadRequestException.java b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/BadRequestException.java new file mode 100644 index 0000000000000..301f3bd63f88d --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/BadRequestException.java @@ -0,0 +1,27 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
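The two helpers above drive header and option handling in RESTCatalog: extractPrefixMap turns "header."-prefixed catalog options into plain HTTP headers, and merge lets the second map win on conflicting keys. A small hedged illustration (values are made up):

    import org.apache.paimon.rest.RESTUtil;

    import org.apache.paimon.shade.guava30.com.google.common.collect.ImmutableMap;

    import java.util.Map;

    class RESTUtilExample {
        public static void main(String[] args) {
            Map<String, String> options =
                    ImmutableMap.of("uri", "http://localhost:8080", "header.x-tenant", "dev");
            // Only keys starting with "header." survive, with the prefix stripped.
            Map<String, String> headers = RESTUtil.extractPrefixMap(options, "header.");
            System.out.println(headers); // {x-tenant=dev}

            // On conflicting keys the second argument wins.
            Map<String, String> merged =
                    RESTUtil.merge(ImmutableMap.of("k", "client"), ImmutableMap.of("k", "server"));
            System.out.println(merged); // {k=server}
        }
    }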
+ */ + +package org.apache.paimon.rest.exceptions; + +/** Exception thrown on HTTP 400 - Bad Request. */ +public class BadRequestException extends RESTException { + + public BadRequestException(String message, Object... args) { + super(message, args); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ForbiddenException.java b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ForbiddenException.java new file mode 100644 index 0000000000000..3982e5b704177 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ForbiddenException.java @@ -0,0 +1,26 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest.exceptions; + +/** Exception thrown on HTTP 403 Forbidden. */ +public class ForbiddenException extends RESTException { + public ForbiddenException(String message, Object... args) { + super(message, args); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/NotAuthorizedException.java b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/NotAuthorizedException.java new file mode 100644 index 0000000000000..43c13b1a1c979 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/NotAuthorizedException.java @@ -0,0 +1,26 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest.exceptions; + +/** Exception thrown on HTTP 401 Unauthorized. */ +public class NotAuthorizedException extends RESTException { + public NotAuthorizedException(String message, Object... 
args) { + super(String.format(message, args)); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/RESTException.java b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/RESTException.java new file mode 100644 index 0000000000000..532936f43032d --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/RESTException.java @@ -0,0 +1,30 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest.exceptions; + +/** Base class for REST client exceptions. */ +public class RESTException extends RuntimeException { + public RESTException(String message, Object... args) { + super(String.format(message, args)); + } + + public RESTException(Throwable cause, String message, Object... args) { + super(String.format(message, args), cause); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ServiceFailureException.java b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ServiceFailureException.java new file mode 100644 index 0000000000000..45c48ec0de094 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ServiceFailureException.java @@ -0,0 +1,26 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest.exceptions; + +/** Exception thrown on HTTP 500 - Bad Request. */ +public class ServiceFailureException extends RESTException { + public ServiceFailureException(String message, Object... 
args) { + super(String.format(message, args)); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ServiceUnavailableException.java b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ServiceUnavailableException.java new file mode 100644 index 0000000000000..fb6a05e89f9f3 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/exceptions/ServiceUnavailableException.java @@ -0,0 +1,26 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest.exceptions; + +/** Exception thrown on HTTP 503 - service is unavailable. */ +public class ServiceUnavailableException extends RESTException { + public ServiceUnavailableException(String message, Object... args) { + super(String.format(message, args)); + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/responses/ConfigResponse.java b/paimon-core/src/main/java/org/apache/paimon/rest/responses/ConfigResponse.java new file mode 100644 index 0000000000000..e6bc934703642 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/responses/ConfigResponse.java @@ -0,0 +1,76 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest.responses; + +import org.apache.paimon.rest.RESTResponse; +import org.apache.paimon.utils.Preconditions; + +import org.apache.paimon.shade.com.fasterxml.jackson.annotation.JsonProperty; +import org.apache.paimon.shade.guava30.com.google.common.collect.ImmutableMap; +import org.apache.paimon.shade.guava30.com.google.common.collect.Maps; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonGetter; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonIgnoreProperties; + +import java.beans.ConstructorProperties; +import java.util.Map; +import java.util.Objects; + +/** Response for getting config. 
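Taken together, the classes above give each HTTP failure mode its own unchecked type (400, 401, 403, 500, 503), all built on RESTException's printf-style message handling. The sketch below is illustrative only — the message and the recovery comments are placeholders, not part of this patch — and shows how messages are formatted and how a caller can react per status type.

    // Illustrative sketch; values and recovery logic are placeholders.
    try {
        throw new NotAuthorizedException("token for user %s has expired", "alice");
    } catch (NotAuthorizedException e) {
        // HTTP 401: re-acquire the token and retry
    } catch (ServiceUnavailableException e) {
        // HTTP 503: back off and retry later
    } catch (RESTException e) {
        // any other REST-level failure: surface to the caller
        throw e;
    }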
*/ +@JsonIgnoreProperties(ignoreUnknown = true) +public class ConfigResponse implements RESTResponse { + private static final String FIELD_DEFAULTS = "defaults"; + private static final String FIELD_OVERRIDES = "overrides"; + + @JsonProperty(FIELD_DEFAULTS) + private Map defaults; + + @JsonProperty(FIELD_OVERRIDES) + private Map overrides; + + @ConstructorProperties({FIELD_DEFAULTS, FIELD_OVERRIDES}) + public ConfigResponse(Map defaults, Map overrides) { + this.defaults = defaults; + this.overrides = overrides; + } + + public Map merge(Map clientProperties) { + Preconditions.checkNotNull( + clientProperties, + "Cannot merge client properties with server-provided properties. Invalid client configuration: null"); + Map merged = + defaults != null ? Maps.newHashMap(defaults) : Maps.newHashMap(); + merged.putAll(clientProperties); + + if (overrides != null) { + merged.putAll(overrides); + } + + return ImmutableMap.copyOf(Maps.filterValues(merged, Objects::nonNull)); + } + + @JsonGetter(FIELD_DEFAULTS) + public Map defaults() { + return defaults; + } + + @JsonGetter(FIELD_OVERRIDES) + public Map overrides() { + return overrides; + } +} diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/responses/ErrorResponse.java b/paimon-core/src/main/java/org/apache/paimon/rest/responses/ErrorResponse.java new file mode 100644 index 0000000000000..0e4b234867329 --- /dev/null +++ b/paimon-core/src/main/java/org/apache/paimon/rest/responses/ErrorResponse.java @@ -0,0 +1,91 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest.responses; + +import org.apache.paimon.shade.com.fasterxml.jackson.annotation.JsonProperty; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonGetter; + +import java.beans.ConstructorProperties; +import java.io.PrintWriter; +import java.io.StringWriter; +import java.util.ArrayList; +import java.util.Arrays; +import java.util.List; + +/** Response for error. 
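ConfigResponse.merge above applies a simple precedence: server defaults are overwritten by client-supplied properties, which are in turn overwritten by server overrides, and null values are filtered out of the immutable result. A small illustration with hypothetical option values (assumes the usual java.util imports):

    Map<String, String> defaults = Collections.singletonMap("cache-enabled", "true");
    Map<String, String> overrides = Collections.singletonMap("warehouse", "s3://bucket/warehouse");
    ConfigResponse response = new ConfigResponse(defaults, overrides);

    Map<String, String> client = new HashMap<>();
    client.put("cache-enabled", "false");     // client beats server defaults
    client.put("warehouse", "file:/tmp/w");   // but loses to server overrides

    Map<String, String> merged = response.merge(client);
    // merged == {cache-enabled=false, warehouse=s3://bucket/warehouse}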
*/ +public class ErrorResponse { + private static final String FIELD_MESSAGE = "message"; + private static final String FIELD_CODE = "code"; + private static final String FIELD_STACK = "stack"; + + @JsonProperty(FIELD_MESSAGE) + private final String message; + + @JsonProperty(FIELD_CODE) + private final Integer code; + + @JsonProperty(FIELD_STACK) + private final List stack; + + public ErrorResponse(String message, Integer code) { + this.code = code; + this.message = message; + this.stack = new ArrayList(); + } + + @ConstructorProperties({FIELD_MESSAGE, FIELD_CODE, FIELD_STACK}) + public ErrorResponse(String message, int code, List stack) { + this.message = message; + this.code = code; + this.stack = stack; + } + + public ErrorResponse(String message, int code, Throwable throwable) { + this.message = message; + this.code = code; + this.stack = getStackFromThrowable(throwable); + } + + @JsonGetter(FIELD_MESSAGE) + public String message() { + return message; + } + + @JsonGetter(FIELD_CODE) + public Integer code() { + return code; + } + + @JsonGetter(FIELD_STACK) + public List stack() { + return stack; + } + + private List getStackFromThrowable(Throwable throwable) { + if (throwable == null) { + return new ArrayList(); + } + StringWriter sw = new StringWriter(); + try (PrintWriter pw = new PrintWriter(sw)) { + throwable.printStackTrace(pw); + } + + return Arrays.asList(sw.toString().split("\n")); + } +} diff --git a/paimon-core/src/main/resources/META-INF/NOTICE b/paimon-core/src/main/resources/META-INF/NOTICE new file mode 100644 index 0000000000000..dd2479b1d6e7c --- /dev/null +++ b/paimon-core/src/main/resources/META-INF/NOTICE @@ -0,0 +1,8 @@ +paimon-core +Copyright 2023-2024 The Apache Software Foundation + +This product includes software developed at +The Apache Software Foundation (http://www.apache.org/). + +This project bundles the following dependencies under the Apache Software License 2.0 (http://www.apache.org/licenses/LICENSE-2.0.txt) +- com.squareup.okhttp3:okhttp:4.12.0 \ No newline at end of file diff --git a/paimon-core/src/main/resources/META-INF/services/org.apache.paimon.factories.Factory b/paimon-core/src/main/resources/META-INF/services/org.apache.paimon.factories.Factory index ac6cc98fed6b7..3b98eef52c851 100644 --- a/paimon-core/src/main/resources/META-INF/services/org.apache.paimon.factories.Factory +++ b/paimon-core/src/main/resources/META-INF/services/org.apache.paimon.factories.Factory @@ -36,3 +36,4 @@ org.apache.paimon.mergetree.compact.aggregate.factory.FieldRoaringBitmap32AggFac org.apache.paimon.mergetree.compact.aggregate.factory.FieldRoaringBitmap64AggFactory org.apache.paimon.mergetree.compact.aggregate.factory.FieldSumAggFactory org.apache.paimon.mergetree.compact.aggregate.factory.FieldThetaSketchAggFactory +org.apache.paimon.rest.RESTCatalogFactory diff --git a/paimon-core/src/test/java/org/apache/paimon/rest/DefaultErrorHandlerTest.java b/paimon-core/src/test/java/org/apache/paimon/rest/DefaultErrorHandlerTest.java new file mode 100644 index 0000000000000..1f1b9c01aace0 --- /dev/null +++ b/paimon-core/src/test/java/org/apache/paimon/rest/DefaultErrorHandlerTest.java @@ -0,0 +1,77 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. 
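ErrorResponse carries the failing message, the HTTP code, and optionally the server-side stack trace flattened to one string per line. A short server-side sketch with hypothetical values:

    ErrorResponse error;
    try {
        throw new IllegalStateException("database not found: db1");
    } catch (IllegalStateException e) {
        error = new ErrorResponse(e.getMessage(), 404, e);
    }
    // error.message() -> "database not found: db1"
    // error.code()    -> 404
    // error.stack()   -> the stack trace produced by printStackTrace, one line per element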
The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.rest.exceptions.BadRequestException; +import org.apache.paimon.rest.exceptions.ForbiddenException; +import org.apache.paimon.rest.exceptions.NotAuthorizedException; +import org.apache.paimon.rest.exceptions.RESTException; +import org.apache.paimon.rest.exceptions.ServiceFailureException; +import org.apache.paimon.rest.exceptions.ServiceUnavailableException; +import org.apache.paimon.rest.responses.ErrorResponse; + +import org.junit.Before; +import org.junit.Test; + +import java.io.IOException; +import java.util.ArrayList; + +import static org.junit.Assert.assertThrows; + +/** Test for {@link DefaultErrorHandler}. */ +public class DefaultErrorHandlerTest { + private ErrorHandler defaultErrorHandler; + + @Before + public void setUp() throws IOException { + defaultErrorHandler = DefaultErrorHandler.getInstance(); + } + + @Test + public void testHandleErrorResponse() { + assertThrows( + BadRequestException.class, + () -> defaultErrorHandler.accept(generateErrorResponse(400))); + assertThrows( + NotAuthorizedException.class, + () -> defaultErrorHandler.accept(generateErrorResponse(401))); + assertThrows( + ForbiddenException.class, + () -> defaultErrorHandler.accept(generateErrorResponse(403))); + assertThrows( + RESTException.class, () -> defaultErrorHandler.accept(generateErrorResponse(405))); + assertThrows( + RESTException.class, () -> defaultErrorHandler.accept(generateErrorResponse(406))); + assertThrows( + ServiceFailureException.class, + () -> defaultErrorHandler.accept(generateErrorResponse(500))); + assertThrows( + UnsupportedOperationException.class, + () -> defaultErrorHandler.accept(generateErrorResponse(501))); + assertThrows( + RESTException.class, () -> defaultErrorHandler.accept(generateErrorResponse(502))); + assertThrows( + ServiceUnavailableException.class, + () -> defaultErrorHandler.accept(generateErrorResponse(503))); + } + + private ErrorResponse generateErrorResponse(int code) { + return new ErrorResponse("message", code, new ArrayList()); + } +} diff --git a/paimon-core/src/test/java/org/apache/paimon/rest/HttpClientTest.java b/paimon-core/src/test/java/org/apache/paimon/rest/HttpClientTest.java new file mode 100644 index 0000000000000..1140e399824cc --- /dev/null +++ b/paimon-core/src/test/java/org/apache/paimon/rest/HttpClientTest.java @@ -0,0 +1,129 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. 
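The DefaultErrorHandler implementation itself is not part of this hunk, but the assertions above pin down its contract: each well-known status code maps to the matching typed exception, 501 maps to UnsupportedOperationException, and unrecognised codes fall back to the RESTException base type. The following mapping is reconstructed from the test, not copied from the handler:

    // Reconstructed from the assertions above; the real handler lives elsewhere in this series.
    static RuntimeException toException(ErrorResponse error) {
        String message = error.message();
        switch (error.code()) {
            case 400: return new BadRequestException(message);
            case 401: return new NotAuthorizedException(message);
            case 403: return new ForbiddenException(message);
            case 500: return new ServiceFailureException(message);
            case 501: return new UnsupportedOperationException(message);
            case 503: return new ServiceUnavailableException(message);
            default:  return new RESTException(message);   // e.g. 405, 406, 502
        }
    }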
You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.shade.guava30.com.google.common.collect.ImmutableMap; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.databind.ObjectMapper; + +import okhttp3.mockwebserver.MockResponse; +import okhttp3.mockwebserver.MockWebServer; +import org.junit.After; +import org.junit.Before; +import org.junit.Test; + +import java.io.IOException; +import java.time.Duration; +import java.util.HashMap; +import java.util.Map; +import java.util.Optional; + +import static org.apache.paimon.rest.RESTCatalog.AUTH_HEADER; +import static org.apache.paimon.rest.RESTCatalog.AUTH_HEADER_VALUE_FORMAT; +import static org.junit.Assert.assertEquals; +import static org.mockito.ArgumentMatchers.any; +import static org.mockito.Mockito.mock; +import static org.mockito.Mockito.times; +import static org.mockito.Mockito.verify; + +/** Test for {@link HttpClient}. */ +public class HttpClientTest { + private MockWebServer mockWebServer; + private HttpClient httpClient; + private ObjectMapper objectMapper = RESTObjectMapper.create(); + private ErrorHandler errorHandler; + private MockRESTData mockResponseData; + private String mockResponseDataStr; + private Map headers; + private static final String MOCK_PATH = "/v1/api/mock"; + private static final String TOKEN = "token"; + + @Before + public void setUp() throws IOException { + mockWebServer = new MockWebServer(); + mockWebServer.start(); + String baseUrl = mockWebServer.url("").toString(); + errorHandler = mock(ErrorHandler.class); + HttpClientOptions httpClientOptions = + new HttpClientOptions( + baseUrl, + Optional.of(Duration.ofSeconds(3)), + Optional.of(Duration.ofSeconds(3)), + objectMapper, + 1, + errorHandler); + mockResponseData = new MockRESTData(MOCK_PATH); + mockResponseDataStr = objectMapper.writeValueAsString(mockResponseData); + httpClient = new HttpClient(httpClientOptions); + headers = ImmutableMap.of(AUTH_HEADER, String.format(AUTH_HEADER_VALUE_FORMAT, TOKEN)); + } + + @After + public void tearDown() throws IOException { + mockWebServer.shutdown(); + } + + @Test + public void testGetSuccess() { + mockHttpCallWithCode(mockResponseDataStr, 200); + MockRESTData response = httpClient.get(MOCK_PATH, MockRESTData.class, headers); + verify(errorHandler, times(0)).accept(any()); + assertEquals(mockResponseData.data(), response.data()); + } + + @Test + public void testGetFail() { + mockHttpCallWithCode(mockResponseDataStr, 400); + httpClient.get(MOCK_PATH, MockRESTData.class, headers); + verify(errorHandler, times(1)).accept(any()); + } + + @Test + public void testPostSuccess() { + mockHttpCallWithCode(mockResponseDataStr, 200); + MockRESTData response = + httpClient.post(MOCK_PATH, mockResponseData, MockRESTData.class, headers); + verify(errorHandler, times(0)).accept(any()); + assertEquals(mockResponseData.data(), response.data()); + } + + @Test + public void testPostFail() { + mockHttpCallWithCode(mockResponseDataStr, 400); + httpClient.post(MOCK_PATH, mockResponseData, MockRESTData.class, headers); + verify(errorHandler, times(1)).accept(any()); + } + + private Map headers(String 
token) { + Map header = new HashMap<>(); + header.put("Authorization", "Bearer " + token); + return header; + } + + private void mockHttpCallWithCode(String body, Integer code) { + MockResponse mockResponseObj = generateMockResponse(body, code); + mockWebServer.enqueue(mockResponseObj); + } + + private MockResponse generateMockResponse(String data, Integer code) { + return new MockResponse() + .setResponseCode(code) + .setBody(data) + .addHeader("Content-Type", "application/json"); + } +} diff --git a/paimon-core/src/test/java/org/apache/paimon/rest/MockRESTData.java b/paimon-core/src/test/java/org/apache/paimon/rest/MockRESTData.java new file mode 100644 index 0000000000000..55c5165ada48e --- /dev/null +++ b/paimon-core/src/test/java/org/apache/paimon/rest/MockRESTData.java @@ -0,0 +1,44 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.rest; + +import org.apache.paimon.shade.com.fasterxml.jackson.annotation.JsonProperty; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonGetter; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonIgnoreProperties; + +import java.beans.ConstructorProperties; + +/** Mock REST data. */ +@JsonIgnoreProperties(ignoreUnknown = true) +public class MockRESTData implements RESTRequest, RESTResponse { + private static final String FIELD_DATA = "data"; + + @JsonProperty(FIELD_DATA) + private String data; + + @ConstructorProperties({FIELD_DATA}) + public MockRESTData(String data) { + this.data = data; + } + + @JsonGetter(FIELD_DATA) + public String data() { + return data; + } +} diff --git a/paimon-core/src/test/java/org/apache/paimon/rest/RESTCatalogTest.java b/paimon-core/src/test/java/org/apache/paimon/rest/RESTCatalogTest.java new file mode 100644 index 0000000000000..3ed8730862ee5 --- /dev/null +++ b/paimon-core/src/test/java/org/apache/paimon/rest/RESTCatalogTest.java @@ -0,0 +1,86 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
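Outside the MockWebServer plumbing, the client surface exercised by this test is small: build HttpClientOptions, then issue typed get/post calls with an Authorization header. A condensed sketch with a placeholder base URL and token; the meaning of the two timeout arguments is assumed from the test, not documented here:

    HttpClientOptions options =
            new HttpClientOptions(
                    "http://localhost:8080",              // placeholder base URL
                    Optional.of(Duration.ofSeconds(3)),   // connect timeout (assumed)
                    Optional.of(Duration.ofSeconds(3)),   // read timeout (assumed)
                    RESTObjectMapper.create(),
                    1,                                    // thread pool size
                    DefaultErrorHandler.getInstance());
    HttpClient client = new HttpClient(options);

    Map<String, String> headers = new HashMap<>();
    headers.put("Authorization", "Bearer my-token");      // placeholder token

    MockRESTData reply = client.get("/v1/api/mock", MockRESTData.class, headers);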
+ */ + +package org.apache.paimon.rest; + +import org.apache.paimon.options.CatalogOptions; +import org.apache.paimon.options.Options; + +import okhttp3.mockwebserver.MockResponse; +import okhttp3.mockwebserver.MockWebServer; +import org.junit.After; +import org.junit.Before; +import org.junit.Test; + +import java.io.IOException; +import java.util.HashMap; +import java.util.Map; + +import static org.junit.Assert.assertEquals; +import static org.junit.Assert.assertThrows; + +/** Test for REST Catalog. */ +public class RESTCatalogTest { + private MockWebServer mockWebServer; + private RESTCatalog restCatalog; + private final String initToken = "init_token"; + + @Before + public void setUp() throws IOException { + mockWebServer = new MockWebServer(); + mockWebServer.start(); + String baseUrl = mockWebServer.url("").toString(); + Options options = new Options(); + options.set(RESTCatalogOptions.URI, baseUrl); + options.set(RESTCatalogOptions.TOKEN, initToken); + options.set(RESTCatalogOptions.THREAD_POOL_SIZE, 1); + mockOptions(RESTCatalogInternalOptions.PREFIX.key(), "prefix"); + restCatalog = new RESTCatalog(options); + } + + @After + public void tearDown() throws IOException { + mockWebServer.shutdown(); + } + + @Test + public void testInitFailWhenDefineWarehouse() { + Options options = new Options(); + options.set(CatalogOptions.WAREHOUSE, "/a/b/c"); + assertThrows(IllegalArgumentException.class, () -> new RESTCatalog(options)); + } + + @Test + public void testGetConfig() { + String key = "a"; + String value = "b"; + mockOptions(key, value); + Map header = new HashMap<>(); + Map response = restCatalog.fetchOptionsFromServer(header, new HashMap<>()); + assertEquals(value, response.get(key)); + } + + private void mockOptions(String key, String value) { + String mockResponse = String.format("{\"defaults\": {\"%s\": \"%s\"}}", key, value); + MockResponse mockResponseObj = + new MockResponse() + .setBody(mockResponse) + .addHeader("Content-Type", "application/json"); + mockWebServer.enqueue(mockResponseObj); + } +} diff --git a/paimon-core/src/test/java/org/apache/paimon/rest/RESTObjectMapperTest.java b/paimon-core/src/test/java/org/apache/paimon/rest/RESTObjectMapperTest.java new file mode 100644 index 0000000000000..83a8805d29a0f --- /dev/null +++ b/paimon-core/src/test/java/org/apache/paimon/rest/RESTObjectMapperTest.java @@ -0,0 +1,59 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
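As the test shows, RESTCatalog is configured purely through Options — URI, token and thread pool size — and rejects a warehouse path, since storage location becomes the server's concern. A minimal construction sketch (placeholder URI and token; note the constructor immediately fetches server-side options, which is why the test mocks the config endpoint before instantiating):

    Options options = new Options();
    options.set(RESTCatalogOptions.URI, "http://localhost:8080");   // placeholder
    options.set(RESTCatalogOptions.TOKEN, "init_token");            // placeholder
    options.set(RESTCatalogOptions.THREAD_POOL_SIZE, 1);
    RESTCatalog catalog = new RESTCatalog(options);

    // Not allowed for this catalog type:
    // options.set(CatalogOptions.WAREHOUSE, "/a/b/c");  -> IllegalArgumentException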
+ */ + +package org.apache.paimon.rest; + +import org.apache.paimon.rest.responses.ConfigResponse; +import org.apache.paimon.rest.responses.ErrorResponse; + +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.databind.ObjectMapper; + +import org.junit.Test; + +import java.util.ArrayList; +import java.util.HashMap; +import java.util.Map; + +import static org.junit.Assert.assertEquals; + +/** Test for {@link RESTObjectMapper}. */ +public class RESTObjectMapperTest { + private ObjectMapper mapper = RESTObjectMapper.create(); + + @Test + public void configResponseParseTest() throws Exception { + String confKey = "a"; + Map conf = new HashMap<>(); + conf.put(confKey, "b"); + ConfigResponse response = new ConfigResponse(conf, conf); + String responseStr = mapper.writeValueAsString(response); + ConfigResponse parseData = mapper.readValue(responseStr, ConfigResponse.class); + assertEquals(conf.get(confKey), parseData.defaults().get(confKey)); + } + + @Test + public void errorResponseParseTest() throws Exception { + String message = "message"; + Integer code = 400; + ErrorResponse response = new ErrorResponse(message, code, new ArrayList()); + String responseStr = mapper.writeValueAsString(response); + ErrorResponse parseData = mapper.readValue(responseStr, ErrorResponse.class); + assertEquals(message, parseData.message()); + assertEquals(code, parseData.code()); + } +} diff --git a/paimon-open-api/Makefile b/paimon-open-api/Makefile new file mode 100644 index 0000000000000..c3264c83dbd02 --- /dev/null +++ b/paimon-open-api/Makefile @@ -0,0 +1,25 @@ +# +# Licensed to the Apache Software Foundation (ASF) under one or more +# contributor license agreements. See the NOTICE file distributed with +# this work for additional information regarding copyright ownership. +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# + +# See: https://cwiki.apache.org/confluence/display/INFRA/git+-+.asf.yaml+features + + +install: + brew install yq + +generate: + @sh generate.sh diff --git a/paimon-open-api/README.md b/paimon-open-api/README.md new file mode 100644 index 0000000000000..9d14a7cdd3643 --- /dev/null +++ b/paimon-open-api/README.md @@ -0,0 +1,10 @@ +# Open API spec + +The `rest-catalog-open-api.yaml` defines the REST catalog interface. + +## Generate Open API Spec +```sh +make install +cd paimon-open-api +make generate +``` \ No newline at end of file diff --git a/paimon-open-api/generate.sh b/paimon-open-api/generate.sh new file mode 100755 index 0000000000000..b63aa538abc45 --- /dev/null +++ b/paimon-open-api/generate.sh @@ -0,0 +1,48 @@ +#!/bin/bash +# +# Licensed to the Apache Software Foundation (ASF) under one or more +# contributor license agreements. See the NOTICE file distributed with +# this work for additional information regarding copyright ownership. +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. 
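For reference, the wire format these tests round-trip is plain JSON keyed by the @JsonProperty names. A sketch of what the mapper produces for ConfigResponse (run inside a method declaring throws Exception; exact key order is not guaranteed):

    ObjectMapper mapper = RESTObjectMapper.create();
    String json = mapper.writeValueAsString(
            new ConfigResponse(
                    Collections.singletonMap("a", "b"),
                    Collections.singletonMap("a", "b")));
    // json ~ {"defaults":{"a":"b"},"overrides":{"a":"b"}}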
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +# Start the application +cd .. +mvn clean install -DskipTests +cd ./paimon-open-api +mvn spring-boot:run & +SPRING_PID=$! +# Wait for the application to be ready +RETRY_COUNT=0 +MAX_RETRIES=10 +SLEEP_DURATION=5 + +until $(curl -s -o /dev/null -w "%{http_code}" http://localhost:8080/swagger-api-docs | grep -q "200"); do + ((RETRY_COUNT++)) + if [ $RETRY_COUNT -gt $MAX_RETRIES ]; then + echo "Failed to start the application after $MAX_RETRIES retries." + exit 1 + fi + echo "Application not ready yet. Retrying in $SLEEP_DURATION seconds..." + sleep $SLEEP_DURATION +done + +echo "Application is ready". + +# Generate the OpenAPI specification file +curl -s "http://localhost:8080/swagger-api-docs" | jq -M > ./rest-catalog-open-api.json +yq --prettyPrint -o=yaml ./rest-catalog-open-api.json > ./rest-catalog-open-api.yaml +rm -rf ./rest-catalog-open-api.json +mvn spotless:apply +# Stop the application +echo "Stopping application..." +kill $SPRING_PID \ No newline at end of file diff --git a/paimon-open-api/pom.xml b/paimon-open-api/pom.xml new file mode 100644 index 0000000000000..b5cee29fe4e7f --- /dev/null +++ b/paimon-open-api/pom.xml @@ -0,0 +1,85 @@ + + + + 4.0.0 + + org.apache.paimon + paimon-parent + 1.0-SNAPSHOT + + + paimon-open-api + + + 8 + 8 + UTF-8 + + + + org.springframework.boot + spring-boot-starter-web + 2.7.18 + + + ch.qos.logback + logback-classic + + + + + + + org.springdoc + springdoc-openapi-ui + 1.7.0 + + + org.apache.paimon + paimon-core + ${project.version} + + + io.swagger.core.v3 + swagger-annotations + 2.2.20 + + + + + + org.springframework.boot + spring-boot-maven-plugin + 2.7.6 + + + org.apache.maven.plugins + maven-compiler-plugin + + 8 + 8 + + + + + + \ No newline at end of file diff --git a/paimon-open-api/rest-catalog-open-api.yaml b/paimon-open-api/rest-catalog-open-api.yaml new file mode 100644 index 0000000000000..432ee123b8d43 --- /dev/null +++ b/paimon-open-api/rest-catalog-open-api.yaml @@ -0,0 +1,60 @@ +# +# Licensed to the Apache Software Foundation (ASF) under one or more +# contributor license agreements. See the NOTICE file distributed with +# this work for additional information regarding copyright ownership. +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# + +--- +openapi: 3.0.1 +info: + title: RESTCatalog API + description: This API exposes endpoints to RESTCatalog. 
+ license: + name: Apache 2.0 + url: https://www.apache.org/licenses/LICENSE-2.0.html + version: "1.0" +servers: + - url: http://localhost:8080 + description: Server URL in Development environment +paths: + /api/v1/config: + get: + tags: + - config + summary: Get Config + operationId: getConfig + responses: + "500": + description: Internal Server Error + "201": + description: Created + content: + application/json: + schema: + $ref: '#/components/schemas/ConfigResponse' +components: + schemas: + ConfigResponse: + type: object + properties: + defaults: + type: object + additionalProperties: + type: string + writeOnly: true + overrides: + type: object + additionalProperties: + type: string + writeOnly: true diff --git a/paimon-open-api/src/main/java/org/apache/paimon/open/api/OpenApiApplication.java b/paimon-open-api/src/main/java/org/apache/paimon/open/api/OpenApiApplication.java new file mode 100644 index 0000000000000..76ce4cbf83c61 --- /dev/null +++ b/paimon-open-api/src/main/java/org/apache/paimon/open/api/OpenApiApplication.java @@ -0,0 +1,31 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.open.api; + +import org.springframework.boot.SpringApplication; +import org.springframework.boot.autoconfigure.SpringBootApplication; + +/** OpenAPI application. */ +@SpringBootApplication +public class OpenApiApplication { + + public static void main(String[] args) { + SpringApplication.run(OpenApiApplication.class, args); + } +} diff --git a/paimon-open-api/src/main/java/org/apache/paimon/open/api/RESTCatalogController.java b/paimon-open-api/src/main/java/org/apache/paimon/open/api/RESTCatalogController.java new file mode 100644 index 0000000000000..b475540571054 --- /dev/null +++ b/paimon-open-api/src/main/java/org/apache/paimon/open/api/RESTCatalogController.java @@ -0,0 +1,69 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.open.api; + +import org.apache.paimon.rest.ResourcePaths; +import org.apache.paimon.rest.responses.ConfigResponse; + +import io.swagger.v3.oas.annotations.Operation; +import io.swagger.v3.oas.annotations.media.Content; +import io.swagger.v3.oas.annotations.media.Schema; +import io.swagger.v3.oas.annotations.responses.ApiResponse; +import io.swagger.v3.oas.annotations.responses.ApiResponses; +import org.springframework.http.HttpStatus; +import org.springframework.http.ResponseEntity; +import org.springframework.web.bind.annotation.CrossOrigin; +import org.springframework.web.bind.annotation.GetMapping; +import org.springframework.web.bind.annotation.RestController; + +import java.util.HashMap; +import java.util.Map; + +/** * RESTCatalog management APIs. */ +@CrossOrigin(origins = "http://localhost:8081") +@RestController +public class RESTCatalogController { + + @Operation( + summary = "Get Config", + tags = {"config"}) + @ApiResponses({ + @ApiResponse( + responseCode = "201", + content = { + @Content( + schema = @Schema(implementation = ConfigResponse.class), + mediaType = "application/json") + }), + @ApiResponse( + responseCode = "500", + content = {@Content(schema = @Schema())}) + }) + @GetMapping(ResourcePaths.V1_CONFIG) + public ResponseEntity getConfig() { + try { + Map defaults = new HashMap<>(); + Map overrides = new HashMap<>(); + ConfigResponse response = new ConfigResponse(defaults, overrides); + return new ResponseEntity<>(response, HttpStatus.CREATED); + } catch (Exception e) { + return new ResponseEntity<>(null, HttpStatus.INTERNAL_SERVER_ERROR); + } + } +} diff --git a/paimon-open-api/src/main/java/org/apache/paimon/open/api/config/OpenAPIConfig.java b/paimon-open-api/src/main/java/org/apache/paimon/open/api/config/OpenAPIConfig.java new file mode 100644 index 0000000000000..01234c41bbff4 --- /dev/null +++ b/paimon-open-api/src/main/java/org/apache/paimon/open/api/config/OpenAPIConfig.java @@ -0,0 +1,60 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.open.api.config; + +import io.swagger.v3.oas.models.OpenAPI; +import io.swagger.v3.oas.models.info.Info; +import io.swagger.v3.oas.models.info.License; +import io.swagger.v3.oas.models.servers.Server; +import org.springframework.beans.factory.annotation.Value; +import org.springframework.context.annotation.Bean; +import org.springframework.context.annotation.Configuration; + +import java.util.ArrayList; +import java.util.List; + +/** Config for OpenAPI. 
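The controller above is stateless, so its behaviour can be seen without a Spring context: it answers the config route with HTTP 201 and a (currently empty) ConfigResponse — the same payload RESTCatalog.fetchOptionsFromServer consumes on the client side. A direct-invocation sketch:

    // Direct invocation, bypassing Spring, just to show the payload shape.
    RESTCatalogController controller = new RESTCatalogController();
    ResponseEntity<ConfigResponse> reply = controller.getConfig();
    // reply.getStatusCode() == HttpStatus.CREATED  (201, as documented in the YAML above)
    // reply.getBody().defaults() and reply.getBody().overrides() are empty maps in this skeleton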
*/ +@Configuration +public class OpenAPIConfig { + + @Value("${openapi.url}") + private String devUrl; + + @Bean + public OpenAPI restCatalogOpenAPI() { + Server server = new Server(); + server.setUrl(devUrl); + server.setDescription("Server URL in Development environment"); + + License mitLicense = + new License() + .name("Apache 2.0") + .url("https://www.apache.org/licenses/LICENSE-2.0.html"); + + Info info = + new Info() + .title("RESTCatalog API") + .version("1.0") + .description("This API exposes endpoints to RESTCatalog.") + .license(mitLicense); + List servers = new ArrayList<>(); + servers.add(server); + return new OpenAPI().info(info).servers(servers); + } +} diff --git a/paimon-open-api/src/main/resources/application.properties b/paimon-open-api/src/main/resources/application.properties new file mode 100644 index 0000000000000..58a975161145b --- /dev/null +++ b/paimon-open-api/src/main/resources/application.properties @@ -0,0 +1,22 @@ +# +# Licensed to the Apache Software Foundation (ASF) under one or more +# contributor license agreements. See the NOTICE file distributed with +# this work for additional information regarding copyright ownership. +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# +springdoc.swagger-ui.path=/swagger-api +springdoc.api-docs.path=/swagger-api-docs +springdoc.swagger-ui.deepLinking=true +springdoc.swagger-ui.tryItOutEnabled=true +springdoc.swagger-ui.filter=true +openapi.url=http://localhost:8080 diff --git a/pom.xml b/pom.xml index 85a880f35158e..904b1c73c7414 100644 --- a/pom.xml +++ b/pom.xml @@ -69,6 +69,7 @@ under the License. paimon-test-utils paimon-arrow tools/ci/paimon-ci-tools + paimon-open-api From 2816811fc69a8209f0674418765a11cd2adf46d5 Mon Sep 17 00:00:00 2001 From: Steven <54518670+yangjf2019@users.noreply.github.com> Date: Thu, 28 Nov 2024 19:59:53 +0800 Subject: [PATCH 078/157] =?UTF-8?q?[doc]=20fix=20the=20=E2=80=98primary-ke?= =?UTF-8?q?y-table=E2=80=99=20link=20(#4606)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- docs/content/flink/action-jars.md | 2 +- docs/content/flink/sql-write.md | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/content/flink/action-jars.md b/docs/content/flink/action-jars.md index 34e911ff6feba..69f9dda1fdcbe 100644 --- a/docs/content/flink/action-jars.md +++ b/docs/content/flink/action-jars.md @@ -50,7 +50,7 @@ Paimon supports "MERGE INTO" via submitting the 'merge_into' job through `flink {{< hint info >}} Important table properties setting: -1. Only [primary key table]({{< ref "primary-key-table" >}}) supports this feature. +1. Only [primary key table]({{< ref "primary-key-table/overview" >}}) supports this feature. 2. The action won't produce UPDATE_BEFORE, so it's not recommended to set 'changelog-producer' = 'input'. 
{{< /hint >}} diff --git a/docs/content/flink/sql-write.md b/docs/content/flink/sql-write.md index 58e90a8f6e3f5..3b6a0498eb279 100644 --- a/docs/content/flink/sql-write.md +++ b/docs/content/flink/sql-write.md @@ -175,7 +175,7 @@ PARTITION (k0 = 0, k1 = 0) SELECT v FROM my_table WHERE false; {{< hint info >}} Important table properties setting: -1. Only [primary key table]({{< ref "primary-key-table" >}}) supports this feature. +1. Only [primary key table]({{< ref "primary-key-table/overview" >}}) supports this feature. 2. [MergeEngine]({{< ref "primary-key-table/merge-engine" >}}) needs to be [deduplicate]({{< ref "primary-key-table/merge-engine#deduplicate" >}}) or [partial-update]({{< ref "primary-key-table/merge-engine#partial-update" >}}) to support this feature. 3. Do not support updating primary keys. From fdcdd09ca09d009b4051fe319cef6050ae58d110 Mon Sep 17 00:00:00 2001 From: WenjunMin Date: Thu, 28 Nov 2024 20:01:37 +0800 Subject: [PATCH 079/157] [core] Avoid extract from file footer when stats mode is none (#4604) --- .../io/StatsCollectingSingleFileWriter.java | 20 ++++++++++++++++++- 1 file changed, 19 insertions(+), 1 deletion(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/io/StatsCollectingSingleFileWriter.java b/paimon-core/src/main/java/org/apache/paimon/io/StatsCollectingSingleFileWriter.java index 2f4190a049dc4..67a3fa6d1acea 100644 --- a/paimon-core/src/main/java/org/apache/paimon/io/StatsCollectingSingleFileWriter.java +++ b/paimon-core/src/main/java/org/apache/paimon/io/StatsCollectingSingleFileWriter.java @@ -25,6 +25,7 @@ import org.apache.paimon.format.SimpleStatsExtractor; import org.apache.paimon.fs.FileIO; import org.apache.paimon.fs.Path; +import org.apache.paimon.statistics.NoneSimpleColStatsCollector; import org.apache.paimon.statistics.SimpleColStatsCollector; import org.apache.paimon.types.RowType; import org.apache.paimon.utils.Preconditions; @@ -32,7 +33,9 @@ import javax.annotation.Nullable; import java.io.IOException; +import java.util.Arrays; import java.util.function.Function; +import java.util.stream.IntStream; /** * A {@link SingleFileWriter} which also produces statistics for each written field. 
@@ -44,6 +47,8 @@ public abstract class StatsCollectingSingleFileWriter extends SingleFileWr @Nullable private final SimpleStatsExtractor simpleStatsExtractor; @Nullable private SimpleStatsCollector simpleStatsCollector = null; + @Nullable private SimpleColStats[] noneStats = null; + private final boolean isStatsDisabled; public StatsCollectingSingleFileWriter( FileIO fileIO, @@ -63,6 +68,15 @@ public StatsCollectingSingleFileWriter( Preconditions.checkArgument( statsCollectors.length == writeSchema.getFieldCount(), "The stats collector is not aligned to write schema."); + this.isStatsDisabled = + Arrays.stream(SimpleColStatsCollector.create(statsCollectors)) + .allMatch(p -> p instanceof NoneSimpleColStatsCollector); + if (isStatsDisabled) { + this.noneStats = + IntStream.range(0, statsCollectors.length) + .mapToObj(i -> SimpleColStats.NONE) + .toArray(SimpleColStats[]::new); + } } @Override @@ -85,7 +99,11 @@ public void writeBundle(BundleRecords bundle) throws IOException { public SimpleColStats[] fieldStats() throws IOException { Preconditions.checkState(closed, "Cannot access metric unless the writer is closed."); if (simpleStatsExtractor != null) { - return simpleStatsExtractor.extract(fileIO, path); + if (isStatsDisabled) { + return noneStats; + } else { + return simpleStatsExtractor.extract(fileIO, path); + } } else { return simpleStatsCollector.extract(); } From 2f93b7b2dbc3a659f3b25bcff6c23aee4218ebfe Mon Sep 17 00:00:00 2001 From: Gang Yang Date: Thu, 28 Nov 2024 20:02:30 +0800 Subject: [PATCH 080/157] [cdc] Add the latest_schema state at schema evolution operator to reduce the latest schema access frequency (#4535) --- .../apache/paimon/types/FieldIdentifier.java | 53 +++++ .../cdc/UpdatedDataFieldsProcessFunction.java | 41 +++- .../flink/action/cdc/SchemaEvolutionTest.java | 219 ++++++++++++++++++ 3 files changed, 312 insertions(+), 1 deletion(-) create mode 100644 paimon-common/src/main/java/org/apache/paimon/types/FieldIdentifier.java create mode 100644 paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/SchemaEvolutionTest.java diff --git a/paimon-common/src/main/java/org/apache/paimon/types/FieldIdentifier.java b/paimon-common/src/main/java/org/apache/paimon/types/FieldIdentifier.java new file mode 100644 index 0000000000000..7e9ced7cf95ac --- /dev/null +++ b/paimon-common/src/main/java/org/apache/paimon/types/FieldIdentifier.java @@ -0,0 +1,53 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.types; + +import java.util.Objects; + +/** Used to indicate the uniqueness of a field. 
*/ +public class FieldIdentifier { + private String name; + private DataType type; + private String description; + + public FieldIdentifier(DataField dataField) { + this.name = dataField.name(); + this.type = dataField.type(); + this.description = dataField.description(); + } + + @Override + public boolean equals(Object o) { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + FieldIdentifier field = (FieldIdentifier) o; + return Objects.equals(name, field.name) + && Objects.equals(type, field.type) + && Objects.equals(description, field.description); + } + + @Override + public int hashCode() { + return Objects.hash(name, type, description); + } +} diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunction.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunction.java index 4a33eb1b7ec94..64f00d96b0f51 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunction.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/UpdatedDataFieldsProcessFunction.java @@ -23,11 +23,18 @@ import org.apache.paimon.schema.SchemaChange; import org.apache.paimon.schema.SchemaManager; import org.apache.paimon.types.DataField; +import org.apache.paimon.types.FieldIdentifier; +import org.apache.paimon.types.RowType; +import org.apache.commons.collections.CollectionUtils; import org.apache.flink.streaming.api.functions.ProcessFunction; import org.apache.flink.util.Collector; +import java.util.HashSet; import java.util.List; +import java.util.Objects; +import java.util.Set; +import java.util.stream.Collectors; /** * A {@link ProcessFunction} to handle schema changes. New schema is represented by a list of {@link @@ -43,19 +50,51 @@ public class UpdatedDataFieldsProcessFunction private final Identifier identifier; + private Set latestFields; + public UpdatedDataFieldsProcessFunction( SchemaManager schemaManager, Identifier identifier, Catalog.Loader catalogLoader) { super(catalogLoader); this.schemaManager = schemaManager; this.identifier = identifier; + this.latestFields = new HashSet<>(); } @Override public void processElement( List updatedDataFields, Context context, Collector collector) throws Exception { - for (SchemaChange schemaChange : extractSchemaChanges(schemaManager, updatedDataFields)) { + List actualUpdatedDataFields = + updatedDataFields.stream() + .filter( + dataField -> + !latestDataFieldContain(new FieldIdentifier(dataField))) + .collect(Collectors.toList()); + if (CollectionUtils.isEmpty(actualUpdatedDataFields)) { + return; + } + for (SchemaChange schemaChange : + extractSchemaChanges(schemaManager, actualUpdatedDataFields)) { applySchemaChange(schemaManager, schemaChange, identifier); } + /** + * Here, actualUpdatedDataFields cannot be used to update latestFields because there is a + * non-SchemaChange.AddColumn scenario. Otherwise, the previously existing fields cannot be + * modified again. 
+ */ + updateLatestFields(); + } + + private boolean latestDataFieldContain(FieldIdentifier dataField) { + return latestFields.stream().anyMatch(previous -> Objects.equals(previous, dataField)); + } + + private void updateLatestFields() { + RowType oldRowType = schemaManager.latest().get().logicalRowType(); + Set fieldIdentifiers = + oldRowType.getFields().stream() + .map(item -> new FieldIdentifier(item)) + .collect(Collectors.toSet()); + latestFields = fieldIdentifiers; } } diff --git a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/SchemaEvolutionTest.java b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/SchemaEvolutionTest.java new file mode 100644 index 0000000000000..9ba18376867ff --- /dev/null +++ b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/action/cdc/SchemaEvolutionTest.java @@ -0,0 +1,219 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink.action.cdc; + +import org.apache.paimon.CoreOptions; +import org.apache.paimon.catalog.Catalog; +import org.apache.paimon.catalog.Identifier; +import org.apache.paimon.flink.FlinkCatalogFactory; +import org.apache.paimon.flink.sink.cdc.UpdatedDataFieldsProcessFunction; +import org.apache.paimon.fs.FileIO; +import org.apache.paimon.fs.Path; +import org.apache.paimon.fs.local.LocalFileIO; +import org.apache.paimon.options.Options; +import org.apache.paimon.schema.Schema; +import org.apache.paimon.schema.SchemaManager; +import org.apache.paimon.schema.SchemaUtils; +import org.apache.paimon.schema.TableSchema; +import org.apache.paimon.table.FileStoreTable; +import org.apache.paimon.table.FileStoreTableFactory; +import org.apache.paimon.table.TableTestBase; +import org.apache.paimon.types.BigIntType; +import org.apache.paimon.types.DataField; +import org.apache.paimon.types.DataTypes; +import org.apache.paimon.types.DecimalType; +import org.apache.paimon.types.DoubleType; +import org.apache.paimon.types.IntType; +import org.apache.paimon.types.VarCharType; + +import org.apache.flink.streaming.api.datastream.DataStream; +import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; +import org.junit.jupiter.api.BeforeEach; +import org.junit.jupiter.api.Test; + +import java.util.Arrays; +import java.util.List; + +/** Used to test schema evolution related logic. 
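The point of the FieldIdentifier cache added above is to stop the schema evolution operator from consulting the schema manager for every incoming batch: fields whose name, type and description already match the latest schema are filtered out, and the cached set is only refreshed after a change has actually been applied. A condensed view of that flow (contains() is used here in place of the anyMatch comparison, which is equivalent given FieldIdentifier's equals/hashCode):

    // Kept across records; refreshed from schemaManager.latest() only after a schema change.
    Set<FieldIdentifier> latestFields = new HashSet<>();

    List<DataField> actualUpdated =
            updatedDataFields.stream()
                    .filter(f -> !latestFields.contains(new FieldIdentifier(f)))
                    .collect(Collectors.toList());
    if (!actualUpdated.isEmpty()) {
        // apply the extracted schema changes, then rebuild latestFields from the new schema
    }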
*/ +public class SchemaEvolutionTest extends TableTestBase { + + private static List> prepareData() { + List upField1 = + Arrays.asList( + new DataField(0, "col_0", new VarCharType(), "test description."), + new DataField(1, "col_1", new IntType(), "test description."), + new DataField(2, "col_2", new IntType(), "test description."), + new DataField(3, "col_3", new VarCharType(), "Someone's desc."), + new DataField(4, "col_4", new VarCharType(), "Someone's desc."), + new DataField(5, "col_5", new VarCharType(), "Someone's desc."), + new DataField(6, "col_6", new DecimalType(), "Someone's desc."), + new DataField(7, "col_7", new VarCharType(), "Someone's desc."), + new DataField(8, "col_8", new VarCharType(), "Someone's desc."), + new DataField(9, "col_9", new VarCharType(), "Someone's desc."), + new DataField(10, "col_10", new VarCharType(), "Someone's desc."), + new DataField(11, "col_11", new VarCharType(), "Someone's desc."), + new DataField(12, "col_12", new DoubleType(), "Someone's desc."), + new DataField(13, "col_13", new VarCharType(), "Someone's desc."), + new DataField(14, "col_14", new VarCharType(), "Someone's desc."), + new DataField(15, "col_15", new VarCharType(), "Someone's desc."), + new DataField(16, "col_16", new VarCharType(), "Someone's desc."), + new DataField(17, "col_17", new VarCharType(), "Someone's desc."), + new DataField(18, "col_18", new VarCharType(), "Someone's desc."), + new DataField(19, "col_19", new VarCharType(), "Someone's desc."), + new DataField(20, "col_20", new VarCharType(), "Someone's desc.")); + List upField2 = + Arrays.asList( + new DataField(0, "col_0", new VarCharType(), "test description."), + new DataField(1, "col_1", new BigIntType(), "test description."), + new DataField(2, "col_2", new IntType(), "test description."), + new DataField(3, "col_3", new VarCharType(), "Someone's desc."), + new DataField(4, "col_4", new VarCharType(), "Someone's desc."), + new DataField(5, "col_5", new VarCharType(), "Someone's desc."), + new DataField(6, "col_6", new DecimalType(), "Someone's desc."), + new DataField(7, "col_7", new VarCharType(), "Someone's desc."), + new DataField(8, "col_8", new VarCharType(), "Someone's desc."), + new DataField(9, "col_9", new VarCharType(), "Someone's desc."), + new DataField(10, "col_10", new VarCharType(), "Someone's desc."), + new DataField(11, "col_11", new VarCharType(), "Someone's desc."), + new DataField(12, "col_12", new DoubleType(), "Someone's desc."), + new DataField(13, "col_13", new VarCharType(), "Someone's desc."), + new DataField(14, "col_14", new VarCharType(), "Someone's desc."), + new DataField(15, "col_15", new VarCharType(), "Someone's desc."), + new DataField(16, "col_16", new VarCharType(), "Someone's desc."), + new DataField(17, "col_17", new VarCharType(), "Someone's desc."), + new DataField(18, "col_18", new VarCharType(), "Someone's desc."), + new DataField(19, "col_19", new VarCharType(), "Someone's desc."), + new DataField(20, "col_20", new VarCharType(), "Someone's desc.")); + List upField3 = + Arrays.asList( + new DataField(0, "col_0", new VarCharType(), "test description."), + new DataField(1, "col_1", new BigIntType(), "test description."), + new DataField(2, "col_2", new IntType(), "test description 2."), + new DataField(3, "col_3", new VarCharType(), "Someone's desc."), + new DataField(4, "col_4", new VarCharType(), "Someone's desc."), + new DataField(5, "col_5", new VarCharType(), "Someone's desc."), + new DataField(6, "col_6", new DecimalType(), "Someone's desc."), + new DataField(7, 
"col_7", new VarCharType(), "Someone's desc."), + new DataField(8, "col_8", new VarCharType(), "Someone's desc."), + new DataField(9, "col_9", new VarCharType(), "Someone's desc."), + new DataField(10, "col_10", new VarCharType(), "Someone's desc."), + new DataField(11, "col_11", new VarCharType(), "Someone's desc."), + new DataField(12, "col_12", new DoubleType(), "Someone's desc."), + new DataField(13, "col_13", new VarCharType(), "Someone's desc."), + new DataField(14, "col_14", new VarCharType(), "Someone's desc."), + new DataField(15, "col_15", new VarCharType(), "Someone's desc."), + new DataField(16, "col_16", new VarCharType(), "Someone's desc."), + new DataField(17, "col_17", new VarCharType(), "Someone's desc."), + new DataField(18, "col_18", new VarCharType(), "Someone's desc."), + new DataField(19, "col_19", new VarCharType(), "Someone's desc."), + new DataField(20, "col_20", new VarCharType(), "Someone's desc.")); + List upField4 = + Arrays.asList( + new DataField(0, "col_0", new VarCharType(), "test description."), + new DataField(1, "col_1", new BigIntType(), "test description."), + new DataField(2, "col_2", new IntType(), "test description."), + new DataField(3, "col_3_1", new VarCharType(), "Someone's desc."), + new DataField(4, "col_4", new VarCharType(), "Someone's desc."), + new DataField(5, "col_5", new VarCharType(), "Someone's desc."), + new DataField(6, "col_6", new DecimalType(), "Someone's desc."), + new DataField(7, "col_7", new VarCharType(), "Someone's desc."), + new DataField(8, "col_8", new VarCharType(), "Someone's desc."), + new DataField(9, "col_9", new VarCharType(), "Someone's desc."), + new DataField(10, "col_10", new VarCharType(), "Someone's desc."), + new DataField(11, "col_11", new VarCharType(), "Someone's desc."), + new DataField(12, "col_12", new DoubleType(), "Someone's desc."), + new DataField(13, "col_13", new VarCharType(), "Someone's desc."), + new DataField(14, "col_14", new VarCharType(), "Someone's desc."), + new DataField(15, "col_15", new VarCharType(), "Someone's desc."), + new DataField(16, "col_16", new VarCharType(), "Someone's desc."), + new DataField(17, "col_17", new VarCharType(), "Someone's desc."), + new DataField(18, "col_18", new VarCharType(), "Someone's desc."), + new DataField(19, "col_19", new VarCharType(), "Someone's desc."), + new DataField(20, "col_20", new VarCharType(), "Someone's desc.")); + List upField5 = + Arrays.asList( + new DataField(0, "col_0", new VarCharType(), "test description."), + new DataField(1, "col_1", new BigIntType(), "test description."), + new DataField(2, "col_2_1", new BigIntType(), "test description 2."), + new DataField(3, "col_3", new VarCharType(), "Someone's desc."), + new DataField(4, "col_4", new VarCharType(), "Someone's desc."), + new DataField(5, "col_5", new VarCharType(), "Someone's desc."), + new DataField(6, "col_6", new DecimalType(), "Someone's desc."), + new DataField(7, "col_7", new VarCharType(), "Someone's desc."), + new DataField(8, "col_8", new VarCharType(), "Someone's desc."), + new DataField(9, "col_9", new VarCharType(), "Someone's desc."), + new DataField(10, "col_10", new VarCharType(), "Someone's desc."), + new DataField(11, "col_11", new VarCharType(), "Someone's desc."), + new DataField(12, "col_12", new DoubleType(), "Someone's desc."), + new DataField(13, "col_13", new VarCharType(), "Someone's desc."), + new DataField(14, "col_14", new VarCharType(), "Someone's desc."), + new DataField(15, "col_15", new VarCharType(), "Someone's desc."), + new DataField(16, 
"col_16", new VarCharType(), "Someone's desc."), + new DataField(17, "col_17", new VarCharType(), "Someone's desc."), + new DataField(18, "col_18", new VarCharType(), "Someone's desc."), + new DataField(19, "col_19", new VarCharType(), "Someone's desc."), + new DataField(20, "col_20", new VarCharType(), "Someone's desc.")); + return Arrays.asList(upField1, upField2, upField3, upField4, upField5); + } + + private FileStoreTable table; + private String tableName = "MyTable"; + + @BeforeEach + public void before() throws Exception { + FileIO fileIO = LocalFileIO.create(); + Path tablePath = new Path(String.format("%s/%s.db/%s", warehouse, database, tableName)); + Schema schema = + Schema.newBuilder() + .column("pk", DataTypes.INT()) + .column("pt1", DataTypes.INT()) + .column("pt2", DataTypes.INT()) + .column("col1", DataTypes.INT()) + .partitionKeys("pt1", "pt2") + .primaryKey("pk", "pt1", "pt2") + .option(CoreOptions.CHANGELOG_PRODUCER.key(), "input") + .option(CoreOptions.BUCKET.key(), "2") + .option(CoreOptions.SEQUENCE_FIELD.key(), "col1") + .build(); + TableSchema tableSchema = + SchemaUtils.forceCommit(new SchemaManager(fileIO, tablePath), schema); + table = FileStoreTableFactory.create(LocalFileIO.create(), tablePath, tableSchema); + } + + @Test + public void testSchemaEvolution() throws Exception { + final StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); + DataStream> upDataFieldStream = env.fromCollection(prepareData()); + Options options = new Options(); + options.set("warehouse", tempPath.toString()); + final Catalog.Loader catalogLoader = () -> FlinkCatalogFactory.createPaimonCatalog(options); + Identifier identifier = Identifier.create(database, tableName); + DataStream schemaChangeProcessFunction = + upDataFieldStream + .process( + new UpdatedDataFieldsProcessFunction( + new SchemaManager(table.fileIO(), table.location()), + identifier, + catalogLoader)) + .name("Schema Evolution"); + schemaChangeProcessFunction.getTransformation().setParallelism(1); + schemaChangeProcessFunction.getTransformation().setMaxParallelism(1); + env.execute(); + } +} From 9a89def5694b95ebed3dc491b52e10079b601959 Mon Sep 17 00:00:00 2001 From: Jingsong Date: Thu, 28 Nov 2024 20:07:57 +0800 Subject: [PATCH 081/157] [pom] Add name to paimon-open-api --- paimon-open-api/pom.xml | 1 + 1 file changed, 1 insertion(+) diff --git a/paimon-open-api/pom.xml b/paimon-open-api/pom.xml index b5cee29fe4e7f..9422852432705 100644 --- a/paimon-open-api/pom.xml +++ b/paimon-open-api/pom.xml @@ -28,6 +28,7 @@ under the License. 
paimon-open-api + Paimon : Open API 8 From 475e48791b873c516c4c26774cda3b45a268cd70 Mon Sep 17 00:00:00 2001 From: Jingsong Lee Date: Fri, 29 Nov 2024 20:38:47 +0800 Subject: [PATCH 082/157] [core] Remove all lineage implementation (#4607) --- .../generated/catalog_configuration.html | 6 - .../org/apache/paimon/factories/Factory.java | 2 +- .../paimon/lineage/DataLineageEntity.java | 33 --- .../apache/paimon/lineage/LineageMeta.java | 102 --------- .../paimon/lineage/LineageMetaFactory.java | 37 ---- .../paimon/lineage/TableLineageEntity.java | 32 --- .../lineage/TableLineageEntityImpl.java | 56 ----- .../apache/paimon/options/CatalogOptions.java | 22 -- .../paimon/catalog/AbstractCatalog.java | 26 +-- .../paimon/table/CatalogEnvironment.java | 18 +- .../table/system/SinkTableLineageTable.java | 64 ------ .../table/system/SourceTableLineageTable.java | 64 ------ .../table/system/SystemTableLoader.java | 29 +-- .../table/system/TableLineageTable.java | 168 -------------- .../flink/AbstractFlinkTableFactory.java | 58 +---- .../paimon/flink/CatalogTableITCase.java | 6 +- .../paimon/flink/FlinkLineageITCase.java | 206 ------------------ .../org.apache.paimon.factories.Factory | 3 - .../org/apache/paimon/hive/HiveCatalog.java | 3 +- 19 files changed, 12 insertions(+), 923 deletions(-) delete mode 100644 paimon-common/src/main/java/org/apache/paimon/lineage/DataLineageEntity.java delete mode 100644 paimon-common/src/main/java/org/apache/paimon/lineage/LineageMeta.java delete mode 100644 paimon-common/src/main/java/org/apache/paimon/lineage/LineageMetaFactory.java delete mode 100644 paimon-common/src/main/java/org/apache/paimon/lineage/TableLineageEntity.java delete mode 100644 paimon-common/src/main/java/org/apache/paimon/lineage/TableLineageEntityImpl.java delete mode 100644 paimon-core/src/main/java/org/apache/paimon/table/system/SinkTableLineageTable.java delete mode 100644 paimon-core/src/main/java/org/apache/paimon/table/system/SourceTableLineageTable.java delete mode 100644 paimon-core/src/main/java/org/apache/paimon/table/system/TableLineageTable.java delete mode 100644 paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkLineageITCase.java diff --git a/docs/layouts/shortcodes/generated/catalog_configuration.html b/docs/layouts/shortcodes/generated/catalog_configuration.html index 6706d5c421a1b..63f7adda1e0df 100644 --- a/docs/layouts/shortcodes/generated/catalog_configuration.html +++ b/docs/layouts/shortcodes/generated/catalog_configuration.html @@ -86,12 +86,6 @@ Boolean Whether to support format tables, format table corresponds to a regular csv, parquet or orc table, allowing read and write operations. However, during these processes, it does not connect to the metastore; hence, newly added partitions will not be reflected in the metastore and need to be manually added as separate partition operations. - -
    lineage-meta
    - (none) - String - The lineage meta to store table and data lineage information.

    Possible values:
    • "jdbc": Use standard jdbc to store table and data lineage information.
    • "custom": You can implement LineageMetaFactory and LineageMeta to store lineage information in customized storage.
    -
    lock-acquire-timeout
    8 min diff --git a/paimon-common/src/main/java/org/apache/paimon/factories/Factory.java b/paimon-common/src/main/java/org/apache/paimon/factories/Factory.java index b0f1ec84c1706..74796879ef4bf 100644 --- a/paimon-common/src/main/java/org/apache/paimon/factories/Factory.java +++ b/paimon-common/src/main/java/org/apache/paimon/factories/Factory.java @@ -20,7 +20,7 @@ /** * Base interface for all kind of factories that create object instances from a list of key-value - * pairs in Paimon's catalog, lineage. + * pairs in Paimon's catalog. * *

    A factory is uniquely identified by {@link Class} and {@link #identifier()}. * diff --git a/paimon-common/src/main/java/org/apache/paimon/lineage/DataLineageEntity.java b/paimon-common/src/main/java/org/apache/paimon/lineage/DataLineageEntity.java deleted file mode 100644 index e7401a9be3b76..0000000000000 --- a/paimon-common/src/main/java/org/apache/paimon/lineage/DataLineageEntity.java +++ /dev/null @@ -1,33 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.paimon.lineage; - -import org.apache.paimon.data.Timestamp; - -/** - * Data lineage entity with table lineage, barrier id and snapshot id for table source and sink - * lineage. - */ -public interface DataLineageEntity extends TableLineageEntity { - long getBarrierId(); - - long getSnapshotId(); - - Timestamp getCreateTime(); -} diff --git a/paimon-common/src/main/java/org/apache/paimon/lineage/LineageMeta.java b/paimon-common/src/main/java/org/apache/paimon/lineage/LineageMeta.java deleted file mode 100644 index 5d1c42daf6c80..0000000000000 --- a/paimon-common/src/main/java/org/apache/paimon/lineage/LineageMeta.java +++ /dev/null @@ -1,102 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.paimon.lineage; - -import org.apache.paimon.predicate.Predicate; - -import javax.annotation.Nullable; - -import java.util.Iterator; - -/** Metadata store will manage table lineage and data lineage information for the catalog. */ -public interface LineageMeta extends AutoCloseable { - /** - * Save the source table and job lineage. - * - * @param entity the table lineage entity - */ - void saveSourceTableLineage(TableLineageEntity entity); - - /** - * Delete the source table lineage for given job. - * - * @param job the job for table lineage - */ - void deleteSourceTableLineage(String job); - - /** - * Get source table and job lineages. 
- * - * @param predicate the predicate for the table lineages - * @return the iterator for source table and job lineages - */ - Iterator sourceTableLineages(@Nullable Predicate predicate); - - /** - * Save the sink table and job lineage. - * - * @param entity the table lineage entity - */ - void saveSinkTableLineage(TableLineageEntity entity); - - /** - * Get sink table and job lineages. - * - * @param predicate the predicate for the table lineages - * @return the iterator for sink table and job lineages - */ - Iterator sinkTableLineages(@Nullable Predicate predicate); - - /** - * Delete the sink table lineage for given job. - * - * @param job the job for table lineage - */ - void deleteSinkTableLineage(String job); - - /** - * Save the source table and job lineage. - * - * @param entity the data lineage entity - */ - void saveSourceDataLineage(DataLineageEntity entity); - - /** - * Get source data and job lineages. - * - * @param predicate the predicate for the table lineages - * @return the iterator for source table and job lineages - */ - Iterator sourceDataLineages(@Nullable Predicate predicate); - - /** - * Save the sink table and job lineage. - * - * @param entity the data lineage entity - */ - void saveSinkDataLineage(DataLineageEntity entity); - - /** - * Get sink data and job lineages. - * - * @param predicate the predicate for the table lineages - * @return the iterator for sink table and job lineages - */ - Iterator sinkDataLineages(@Nullable Predicate predicate); -} diff --git a/paimon-common/src/main/java/org/apache/paimon/lineage/LineageMetaFactory.java b/paimon-common/src/main/java/org/apache/paimon/lineage/LineageMetaFactory.java deleted file mode 100644 index 11c6d3a1173c7..0000000000000 --- a/paimon-common/src/main/java/org/apache/paimon/lineage/LineageMetaFactory.java +++ /dev/null @@ -1,37 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.paimon.lineage; - -import org.apache.paimon.factories.Factory; -import org.apache.paimon.options.Options; - -import java.io.Serializable; - -/** Factory to create {@link LineageMeta}. Each factory should have a unique identifier. */ -public interface LineageMetaFactory extends Factory, Serializable { - - LineageMeta create(LineageMetaContext context); - - /** - * Context has all options in a catalog and is used in factory to create {@link LineageMeta}. 
- */ - interface LineageMetaContext { - Options options(); - } -} diff --git a/paimon-common/src/main/java/org/apache/paimon/lineage/TableLineageEntity.java b/paimon-common/src/main/java/org/apache/paimon/lineage/TableLineageEntity.java deleted file mode 100644 index c4312c4eb080f..0000000000000 --- a/paimon-common/src/main/java/org/apache/paimon/lineage/TableLineageEntity.java +++ /dev/null @@ -1,32 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.paimon.lineage; - -import org.apache.paimon.data.Timestamp; - -/** Table lineage entity with database, table and job for table source and sink lineage. */ -public interface TableLineageEntity { - String getDatabase(); - - String getTable(); - - String getJob(); - - Timestamp getCreateTime(); -} diff --git a/paimon-common/src/main/java/org/apache/paimon/lineage/TableLineageEntityImpl.java b/paimon-common/src/main/java/org/apache/paimon/lineage/TableLineageEntityImpl.java deleted file mode 100644 index ef11ee87f15c9..0000000000000 --- a/paimon-common/src/main/java/org/apache/paimon/lineage/TableLineageEntityImpl.java +++ /dev/null @@ -1,56 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.paimon.lineage; - -import org.apache.paimon.data.Timestamp; - -/** Default implementation for {@link TableLineageEntity}. 
*/ -public class TableLineageEntityImpl implements TableLineageEntity { - private final String database; - private final String table; - private final String job; - private final Timestamp timestamp; - - public TableLineageEntityImpl(String database, String table, String job, Timestamp timestamp) { - this.database = database; - this.table = table; - this.job = job; - this.timestamp = timestamp; - } - - @Override - public String getDatabase() { - return database; - } - - @Override - public String getTable() { - return table; - } - - @Override - public String getJob() { - return job; - } - - @Override - public Timestamp getCreateTime() { - return timestamp; - } -} diff --git a/paimon-common/src/main/java/org/apache/paimon/options/CatalogOptions.java b/paimon-common/src/main/java/org/apache/paimon/options/CatalogOptions.java index f69af2d599103..bb8cfae682848 100644 --- a/paimon-common/src/main/java/org/apache/paimon/options/CatalogOptions.java +++ b/paimon-common/src/main/java/org/apache/paimon/options/CatalogOptions.java @@ -18,8 +18,6 @@ package org.apache.paimon.options; -import org.apache.paimon.options.description.Description; -import org.apache.paimon.options.description.TextElement; import org.apache.paimon.table.CatalogTableType; import java.time.Duration; @@ -130,26 +128,6 @@ public class CatalogOptions { .withDescription( "Controls the max number for snapshots per table in the catalog are cached."); - public static final ConfigOption LINEAGE_META = - key("lineage-meta") - .stringType() - .noDefaultValue() - .withDescription( - Description.builder() - .text( - "The lineage meta to store table and data lineage information.") - .linebreak() - .linebreak() - .text("Possible values:") - .linebreak() - .list( - TextElement.text( - "\"jdbc\": Use standard jdbc to store table and data lineage information.")) - .list( - TextElement.text( - "\"custom\": You can implement LineageMetaFactory and LineageMeta to store lineage information in customized storage.")) - .build()); - public static final ConfigOption ALLOW_UPPER_CASE = ConfigOptions.key("allow-upper-case") .booleanType() diff --git a/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java b/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java index 16b76513d7efd..2b277a29b8359 100644 --- a/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java +++ b/paimon-core/src/main/java/org/apache/paimon/catalog/AbstractCatalog.java @@ -24,7 +24,6 @@ import org.apache.paimon.fs.FileIO; import org.apache.paimon.fs.FileStatus; import org.apache.paimon.fs.Path; -import org.apache.paimon.lineage.LineageMetaFactory; import org.apache.paimon.manifest.PartitionEntry; import org.apache.paimon.metastore.MetastoreClient; import org.apache.paimon.operation.FileStoreCommit; @@ -62,7 +61,6 @@ import static org.apache.paimon.CoreOptions.TYPE; import static org.apache.paimon.CoreOptions.createCommitUser; import static org.apache.paimon.options.CatalogOptions.ALLOW_UPPER_CASE; -import static org.apache.paimon.options.CatalogOptions.LINEAGE_META; import static org.apache.paimon.options.CatalogOptions.LOCK_ENABLED; import static org.apache.paimon.options.CatalogOptions.LOCK_TYPE; import static org.apache.paimon.utils.BranchManager.DEFAULT_MAIN_BRANCH; @@ -76,19 +74,14 @@ public abstract class AbstractCatalog implements Catalog { protected final Map tableDefaultOptions; protected final Options catalogOptions; - @Nullable protected final LineageMetaFactory lineageMetaFactory; - protected AbstractCatalog(FileIO 
fileIO) { this.fileIO = fileIO; - this.lineageMetaFactory = null; this.tableDefaultOptions = new HashMap<>(); this.catalogOptions = new Options(); } protected AbstractCatalog(FileIO fileIO, Options options) { this.fileIO = fileIO; - this.lineageMetaFactory = - findAndCreateLineageMeta(options, AbstractCatalog.class.getClassLoader()); this.tableDefaultOptions = Catalog.tableDefaultOptions(options.toMap()); this.catalogOptions = options; } @@ -377,27 +370,13 @@ public void alterTable( protected abstract void alterTableImpl(Identifier identifier, List changes) throws TableNotExistException, ColumnAlreadyExistException, ColumnNotExistException; - @Nullable - private LineageMetaFactory findAndCreateLineageMeta(Options options, ClassLoader classLoader) { - return options.getOptional(LINEAGE_META) - .map( - meta -> - FactoryUtil.discoverFactory( - classLoader, LineageMetaFactory.class, meta)) - .orElse(null); - } - @Override public Table getTable(Identifier identifier) throws TableNotExistException { if (isSystemDatabase(identifier.getDatabaseName())) { String tableName = identifier.getTableName(); Table table = SystemTableLoader.loadGlobal( - tableName, - fileIO, - this::allTablePaths, - catalogOptions, - lineageMetaFactory); + tableName, fileIO, this::allTablePaths, catalogOptions); if (table == null) { throw new TableNotExistException(identifier); } @@ -444,8 +423,7 @@ protected Table getDataOrFormatTable(Identifier identifier) throws TableNotExist lockFactory().orElse(null), lockContext().orElse(null), identifier), - metastoreClientFactory(identifier, tableMeta.schema).orElse(null), - lineageMetaFactory)); + metastoreClientFactory(identifier, tableMeta.schema).orElse(null))); CoreOptions options = table.coreOptions(); if (options.type() == TableType.OBJECT_TABLE) { String objectLocation = options.objectLocation(); diff --git a/paimon-core/src/main/java/org/apache/paimon/table/CatalogEnvironment.java b/paimon-core/src/main/java/org/apache/paimon/table/CatalogEnvironment.java index 9ff5f9b4f6a83..a722d9e21ada3 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/CatalogEnvironment.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/CatalogEnvironment.java @@ -19,7 +19,6 @@ package org.apache.paimon.table; import org.apache.paimon.catalog.Identifier; -import org.apache.paimon.lineage.LineageMetaFactory; import org.apache.paimon.metastore.MetastoreClient; import org.apache.paimon.operation.Lock; @@ -27,10 +26,7 @@ import java.io.Serializable; -/** - * Catalog environment in table which contains log factory, metastore client factory and lineage - * meta. - */ +/** Catalog environment in table which contains log factory, metastore client factory. 
*/ public class CatalogEnvironment implements Serializable { private static final long serialVersionUID = 1L; @@ -39,23 +35,20 @@ public class CatalogEnvironment implements Serializable { @Nullable private final String uuid; private final Lock.Factory lockFactory; @Nullable private final MetastoreClient.Factory metastoreClientFactory; - @Nullable private final LineageMetaFactory lineageMetaFactory; public CatalogEnvironment( @Nullable Identifier identifier, @Nullable String uuid, Lock.Factory lockFactory, - @Nullable MetastoreClient.Factory metastoreClientFactory, - @Nullable LineageMetaFactory lineageMetaFactory) { + @Nullable MetastoreClient.Factory metastoreClientFactory) { this.identifier = identifier; this.uuid = uuid; this.lockFactory = lockFactory; this.metastoreClientFactory = metastoreClientFactory; - this.lineageMetaFactory = lineageMetaFactory; } public static CatalogEnvironment empty() { - return new CatalogEnvironment(null, null, Lock.emptyFactory(), null, null); + return new CatalogEnvironment(null, null, Lock.emptyFactory(), null); } @Nullable @@ -76,9 +69,4 @@ public Lock.Factory lockFactory() { public MetastoreClient.Factory metastoreClientFactory() { return metastoreClientFactory; } - - @Nullable - public LineageMetaFactory lineageMetaFactory() { - return lineageMetaFactory; - } } diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/SinkTableLineageTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/SinkTableLineageTable.java deleted file mode 100644 index 71efce0704713..0000000000000 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/SinkTableLineageTable.java +++ /dev/null @@ -1,64 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.paimon.table.system; - -import org.apache.paimon.lineage.LineageMeta; -import org.apache.paimon.lineage.LineageMetaFactory; -import org.apache.paimon.options.Options; -import org.apache.paimon.table.Table; -import org.apache.paimon.table.source.InnerTableRead; - -import java.util.Map; - -/** - * This is a system table to display all the sink table lineages. - * - *

    - *  For example:
    - *     If we select * from sys.sink_table_lineage, we will get
    - *     database_name       table_name       job_name      create_time
    - *        default            test0            job1    2023-10-22 20:35:12
    - *       database1           test1            job1    2023-10-28 21:35:52
    - *          ...               ...             ...             ...
    - *     We can write sql to fetch the information we need.
    - * 
    - */ -public class SinkTableLineageTable extends TableLineageTable { - - public static final String SINK_TABLE_LINEAGE = "sink_table_lineage"; - - public SinkTableLineageTable(LineageMetaFactory lineageMetaFactory, Options options) { - super(lineageMetaFactory, options); - } - - @Override - public InnerTableRead newRead() { - return new TableLineageRead(lineageMetaFactory, options, LineageMeta::sinkTableLineages); - } - - @Override - public String name() { - return SINK_TABLE_LINEAGE; - } - - @Override - public Table copy(Map dynamicOptions) { - return new SinkTableLineageTable(lineageMetaFactory, options); - } -} diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/SourceTableLineageTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/SourceTableLineageTable.java deleted file mode 100644 index 5d9904fa66754..0000000000000 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/SourceTableLineageTable.java +++ /dev/null @@ -1,64 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.paimon.table.system; - -import org.apache.paimon.lineage.LineageMeta; -import org.apache.paimon.lineage.LineageMetaFactory; -import org.apache.paimon.options.Options; -import org.apache.paimon.table.Table; -import org.apache.paimon.table.source.InnerTableRead; - -import java.util.Map; - -/** - * This is a system table to display all the source table lineages. - * - *
    - *  For example:
    - *     If we select * from sys.source_table_lineage, we will get
    - *     database_name       table_name       job_name      create_time
    - *        default            test0            job1    2023-10-22 20:35:12
    - *       database1           test1            job1    2023-10-28 21:35:52
    - *          ...               ...             ...             ...
    - *     We can write sql to fetch the information we need.
    - * 
    - */ -public class SourceTableLineageTable extends TableLineageTable { - - public static final String SOURCE_TABLE_LINEAGE = "source_table_lineage"; - - public SourceTableLineageTable(LineageMetaFactory lineageMetaFactory, Options options) { - super(lineageMetaFactory, options); - } - - @Override - public InnerTableRead newRead() { - return new TableLineageRead(lineageMetaFactory, options, LineageMeta::sourceTableLineages); - } - - @Override - public String name() { - return SOURCE_TABLE_LINEAGE; - } - - @Override - public Table copy(Map dynamicOptions) { - return new SourceTableLineageTable(lineageMetaFactory, options); - } -} diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/SystemTableLoader.java b/paimon-core/src/main/java/org/apache/paimon/table/system/SystemTableLoader.java index 3d5b211316ec1..763e4d1216731 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/SystemTableLoader.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/system/SystemTableLoader.java @@ -20,7 +20,6 @@ import org.apache.paimon.fs.FileIO; import org.apache.paimon.fs.Path; -import org.apache.paimon.lineage.LineageMetaFactory; import org.apache.paimon.options.Options; import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.Table; @@ -37,7 +36,6 @@ import java.util.function.Function; import java.util.function.Supplier; -import static org.apache.paimon.options.CatalogOptions.LINEAGE_META; import static org.apache.paimon.table.system.AggregationFieldsTable.AGGREGATION_FIELDS; import static org.apache.paimon.table.system.AllTableOptionsTable.ALL_TABLE_OPTIONS; import static org.apache.paimon.table.system.AuditLogTable.AUDIT_LOG; @@ -52,12 +50,9 @@ import static org.apache.paimon.table.system.PartitionsTable.PARTITIONS; import static org.apache.paimon.table.system.ReadOptimizedTable.READ_OPTIMIZED; import static org.apache.paimon.table.system.SchemasTable.SCHEMAS; -import static org.apache.paimon.table.system.SinkTableLineageTable.SINK_TABLE_LINEAGE; import static org.apache.paimon.table.system.SnapshotsTable.SNAPSHOTS; -import static org.apache.paimon.table.system.SourceTableLineageTable.SOURCE_TABLE_LINEAGE; import static org.apache.paimon.table.system.StatisticTable.STATISTICS; import static org.apache.paimon.table.system.TagsTable.TAGS; -import static org.apache.paimon.utils.Preconditions.checkNotNull; /** Loader to load system {@link Table}s. 
*/ public class SystemTableLoader { @@ -95,38 +90,18 @@ public static Table loadGlobal( String tableName, FileIO fileIO, Supplier>> allTablePaths, - Options catalogOptions, - @Nullable LineageMetaFactory lineageMetaFactory) { + Options catalogOptions) { switch (tableName.toLowerCase()) { case ALL_TABLE_OPTIONS: return new AllTableOptionsTable(fileIO, allTablePaths.get()); case CATALOG_OPTIONS: return new CatalogOptionsTable(catalogOptions); - case SOURCE_TABLE_LINEAGE: - { - checkNotNull( - lineageMetaFactory, - String.format( - "Lineage meta should be configured for catalog with %s", - LINEAGE_META.key())); - return new SourceTableLineageTable(lineageMetaFactory, catalogOptions); - } - case SINK_TABLE_LINEAGE: - { - checkNotNull( - lineageMetaFactory, - String.format( - "Lineage meta should be configured for catalog with %s", - LINEAGE_META.key())); - return new SinkTableLineageTable(lineageMetaFactory, catalogOptions); - } default: return null; } } public static List loadGlobalTableNames() { - return Arrays.asList( - ALL_TABLE_OPTIONS, CATALOG_OPTIONS, SOURCE_TABLE_LINEAGE, SINK_TABLE_LINEAGE); + return Arrays.asList(ALL_TABLE_OPTIONS, CATALOG_OPTIONS); } } diff --git a/paimon-core/src/main/java/org/apache/paimon/table/system/TableLineageTable.java b/paimon-core/src/main/java/org/apache/paimon/table/system/TableLineageTable.java deleted file mode 100644 index aeaf3ca3b1330..0000000000000 --- a/paimon-core/src/main/java/org/apache/paimon/table/system/TableLineageTable.java +++ /dev/null @@ -1,168 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. 
- */ - -package org.apache.paimon.table.system; - -import org.apache.paimon.data.BinaryString; -import org.apache.paimon.data.GenericRow; -import org.apache.paimon.data.InternalRow; -import org.apache.paimon.disk.IOManager; -import org.apache.paimon.lineage.LineageMeta; -import org.apache.paimon.lineage.LineageMetaFactory; -import org.apache.paimon.lineage.TableLineageEntity; -import org.apache.paimon.options.Options; -import org.apache.paimon.predicate.Predicate; -import org.apache.paimon.reader.RecordReader; -import org.apache.paimon.table.ReadonlyTable; -import org.apache.paimon.table.source.InnerTableRead; -import org.apache.paimon.table.source.InnerTableScan; -import org.apache.paimon.table.source.ReadOnceTableScan; -import org.apache.paimon.table.source.Split; -import org.apache.paimon.table.source.TableRead; -import org.apache.paimon.types.DataField; -import org.apache.paimon.types.RowType; -import org.apache.paimon.types.TimestampType; -import org.apache.paimon.types.VarCharType; -import org.apache.paimon.utils.IteratorRecordReader; -import org.apache.paimon.utils.ProjectedRow; - -import org.apache.paimon.shade.guava30.com.google.common.collect.Iterators; - -import javax.annotation.Nullable; - -import java.io.IOException; -import java.util.Arrays; -import java.util.Collections; -import java.util.Iterator; -import java.util.List; -import java.util.function.BiFunction; - -import static org.apache.paimon.utils.Preconditions.checkNotNull; - -/** Base lineage table for source and sink table lineage. */ -public abstract class TableLineageTable implements ReadonlyTable { - protected final LineageMetaFactory lineageMetaFactory; - protected final Options options; - - public static final RowType TABLE_TYPE = - new RowType( - Arrays.asList( - new DataField( - 0, "database_name", new VarCharType(VarCharType.MAX_LENGTH)), - new DataField(1, "table_name", new VarCharType(VarCharType.MAX_LENGTH)), - new DataField(2, "job_name", new VarCharType(VarCharType.MAX_LENGTH)), - new DataField(3, "create_time", new TimestampType()))); - - protected TableLineageTable(LineageMetaFactory lineageMetaFactory, Options options) { - this.lineageMetaFactory = lineageMetaFactory; - this.options = options; - } - - @Override - public InnerTableScan newScan() { - return new ReadOnceTableScan() { - @Override - public InnerTableScan withFilter(Predicate predicate) { - return this; - } - - @Override - protected Plan innerPlan() { - /// TODO get the real row count for plan. - return () -> Collections.singletonList((Split) () -> 1L); - } - }; - } - - @Override - public RowType rowType() { - return TABLE_TYPE; - } - - @Override - public List primaryKeys() { - return Arrays.asList("database_name", "table_name", "job_name"); - } - - /** Table lineage read with lineage meta query. 
*/ - protected static class TableLineageRead implements InnerTableRead { - private final LineageMetaFactory lineageMetaFactory; - private final Options options; - private final BiFunction> - tableLineageQuery; - @Nullable private Predicate predicate; - private RowType readType; - - protected TableLineageRead( - LineageMetaFactory lineageMetaFactory, - Options options, - BiFunction> - tableLineageQuery) { - this.lineageMetaFactory = lineageMetaFactory; - this.options = options; - this.tableLineageQuery = tableLineageQuery; - this.predicate = null; - } - - @Override - public InnerTableRead withFilter(Predicate predicate) { - this.predicate = predicate; - return this; - } - - @Override - public InnerTableRead withReadType(RowType readType) { - this.readType = readType; - return this; - } - - @Override - public TableRead withIOManager(IOManager ioManager) { - return this; - } - - @Override - public RecordReader createReader(Split split) throws IOException { - try (LineageMeta lineageMeta = lineageMetaFactory.create(() -> options)) { - Iterator sourceTableLineages = - tableLineageQuery.apply(lineageMeta, predicate); - return new IteratorRecordReader<>( - Iterators.transform( - sourceTableLineages, - entity -> { - checkNotNull(entity); - GenericRow row = - GenericRow.of( - BinaryString.fromString(entity.getDatabase()), - BinaryString.fromString(entity.getTable()), - BinaryString.fromString(entity.getJob()), - entity.getCreateTime()); - if (readType != null) { - return ProjectedRow.from( - readType, TableLineageTable.TABLE_TYPE) - .replaceRow(row); - } else { - return row; - } - })); - } catch (Exception e) { - throw new RuntimeException(e); - } - } - } -} diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/AbstractFlinkTableFactory.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/AbstractFlinkTableFactory.java index 9f90a2cd01304..6b10dbb84bf46 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/AbstractFlinkTableFactory.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/AbstractFlinkTableFactory.java @@ -25,15 +25,10 @@ import org.apache.paimon.catalog.Catalog; import org.apache.paimon.catalog.CatalogContext; import org.apache.paimon.catalog.Identifier; -import org.apache.paimon.data.Timestamp; import org.apache.paimon.flink.log.LogStoreTableFactory; import org.apache.paimon.flink.sink.FlinkTableSink; import org.apache.paimon.flink.source.DataTableSource; import org.apache.paimon.flink.source.SystemTableSource; -import org.apache.paimon.lineage.LineageMeta; -import org.apache.paimon.lineage.LineageMetaFactory; -import org.apache.paimon.lineage.TableLineageEntity; -import org.apache.paimon.lineage.TableLineageEntityImpl; import org.apache.paimon.options.Options; import org.apache.paimon.options.OptionsUtils; import org.apache.paimon.schema.Schema; @@ -47,7 +42,6 @@ import org.apache.flink.configuration.ConfigOption; import org.apache.flink.configuration.Configuration; import org.apache.flink.configuration.ExecutionOptions; -import org.apache.flink.configuration.PipelineOptions; import org.apache.flink.configuration.ReadableConfig; import org.apache.flink.table.api.TableConfig; import org.apache.flink.table.api.ValidationException; @@ -71,7 +65,6 @@ import java.util.Objects; import java.util.Optional; import java.util.Set; -import java.util.function.BiConsumer; import java.util.regex.Pattern; import static org.apache.paimon.CoreOptions.LOG_CHANGELOG_MODE; @@ -109,23 +102,9 
@@ public DynamicTableSource createDynamicTableSource(Context context) { isStreamingMode, context.getObjectIdentifier()); } else { - Table table = buildPaimonTable(context); - if (table instanceof FileStoreTable) { - storeTableLineage( - ((FileStoreTable) table).catalogEnvironment().lineageMetaFactory(), - context, - (entity, lineageFactory) -> { - try (LineageMeta lineage = - lineageFactory.create(() -> Options.fromMap(table.options()))) { - lineage.saveSourceTableLineage(entity); - } catch (Exception e) { - throw new RuntimeException(e); - } - }); - } return new DataTableSource( context.getObjectIdentifier(), - table, + buildPaimonTable(context), isStreamingMode, context, createOptionalLogStoreFactory(context).orElse(null)); @@ -134,46 +113,13 @@ public DynamicTableSource createDynamicTableSource(Context context) { @Override public DynamicTableSink createDynamicTableSink(Context context) { - Table table = buildPaimonTable(context); - if (table instanceof FileStoreTable) { - storeTableLineage( - ((FileStoreTable) table).catalogEnvironment().lineageMetaFactory(), - context, - (entity, lineageFactory) -> { - try (LineageMeta lineage = - lineageFactory.create(() -> Options.fromMap(table.options()))) { - lineage.saveSinkTableLineage(entity); - } catch (Exception e) { - throw new RuntimeException(e); - } - }); - } return new FlinkTableSink( context.getObjectIdentifier(), - table, + buildPaimonTable(context), context, createOptionalLogStoreFactory(context).orElse(null)); } - private void storeTableLineage( - @Nullable LineageMetaFactory lineageMetaFactory, - Context context, - BiConsumer tableLineage) { - if (lineageMetaFactory != null) { - String pipelineName = context.getConfiguration().get(PipelineOptions.NAME); - if (pipelineName == null) { - throw new ValidationException("Cannot get pipeline name for lineage meta."); - } - tableLineage.accept( - new TableLineageEntityImpl( - context.getObjectIdentifier().getDatabaseName(), - context.getObjectIdentifier().getObjectName(), - pipelineName, - Timestamp.fromEpochMillis(System.currentTimeMillis())), - lineageMetaFactory); - } - } - @Override public Set> requiredOptions() { return Collections.emptySet(); diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java index 96334de3f87b5..10b03b7139ae3 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/CatalogTableITCase.java @@ -21,8 +21,6 @@ import org.apache.paimon.catalog.Catalog; import org.apache.paimon.table.system.AllTableOptionsTable; import org.apache.paimon.table.system.CatalogOptionsTable; -import org.apache.paimon.table.system.SinkTableLineageTable; -import org.apache.paimon.table.system.SourceTableLineageTable; import org.apache.paimon.utils.BlockingIterator; import org.apache.commons.lang3.StringUtils; @@ -200,9 +198,7 @@ public void testSystemDatabase() { assertThat(sql("SHOW TABLES")) .containsExactlyInAnyOrder( Row.of(AllTableOptionsTable.ALL_TABLE_OPTIONS), - Row.of(CatalogOptionsTable.CATALOG_OPTIONS), - Row.of(SourceTableLineageTable.SOURCE_TABLE_LINEAGE), - Row.of(SinkTableLineageTable.SINK_TABLE_LINEAGE)); + Row.of(CatalogOptionsTable.CATALOG_OPTIONS)); } @Test diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkLineageITCase.java 
b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkLineageITCase.java deleted file mode 100644 index 5b61d5272f80e..0000000000000 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkLineageITCase.java +++ /dev/null @@ -1,206 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one - * or more contributor license agreements. See the NOTICE file - * distributed with this work for additional information - * regarding copyright ownership. The ASF licenses this file - * to you under the Apache License, Version 2.0 (the - * "License"); you may not use this file except in compliance - * with the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package org.apache.paimon.flink; - -import org.apache.paimon.lineage.DataLineageEntity; -import org.apache.paimon.lineage.LineageMeta; -import org.apache.paimon.lineage.LineageMetaFactory; -import org.apache.paimon.lineage.TableLineageEntity; -import org.apache.paimon.predicate.Predicate; - -import org.apache.flink.configuration.PipelineOptions; -import org.apache.flink.table.api.ValidationException; -import org.apache.flink.types.Row; -import org.apache.flink.util.CloseableIterator; -import org.junit.jupiter.api.Test; - -import javax.annotation.Nullable; - -import java.util.ArrayList; -import java.util.Collections; -import java.util.HashMap; -import java.util.Iterator; -import java.util.List; -import java.util.Map; - -import static org.apache.paimon.options.CatalogOptions.LINEAGE_META; -import static org.assertj.core.api.Assertions.assertThat; -import static org.assertj.core.api.Assertions.assertThatThrownBy; - -/** ITCase for flink table and data lineage. 
*/ -public class FlinkLineageITCase extends CatalogITCaseBase { - private static final String THROWING_META = "throwing-meta"; - private static final Map> jobSourceTableLineages = - new HashMap<>(); - private static final Map> jobSinkTableLineages = - new HashMap<>(); - - @Override - protected List ddl() { - return Collections.singletonList("CREATE TABLE IF NOT EXISTS T (a INT, b INT, c INT)"); - } - - @Override - protected Map catalogOptions() { - return Collections.singletonMap(LINEAGE_META.key(), THROWING_META); - } - - @Test - public void testTableLineage() throws Exception { - // Validate for source and sink lineage when pipeline name is null - assertThatThrownBy( - () -> tEnv.executeSql("INSERT INTO T VALUES (1, 2, 3),(4, 5, 6);").await()) - .hasCauseExactlyInstanceOf(ValidationException.class) - .hasRootCauseMessage("Cannot get pipeline name for lineage meta."); - assertThatThrownBy(() -> tEnv.executeSql("SELECT * FROM T").collect().close()) - .hasCauseExactlyInstanceOf(ValidationException.class) - .hasRootCauseMessage("Cannot get pipeline name for lineage meta."); - - // Call storeSinkTableLineage and storeSourceTableLineage methods - tEnv.getConfig().getConfiguration().set(PipelineOptions.NAME, "insert_t_job"); - tEnv.executeSql("INSERT INTO T VALUES (1, 2, 3),(4, 5, 6);").await(); - assertThat(jobSinkTableLineages).isNotEmpty(); - TableLineageEntity sinkTableLineage = - jobSinkTableLineages.get("insert_t_job").get("default.T.insert_t_job"); - assertThat(sinkTableLineage.getTable()).isEqualTo("T"); - - List sinkTableRows = new ArrayList<>(); - try (CloseableIterator iterator = - tEnv.executeSql("SELECT * FROM sys.sink_table_lineage").collect()) { - while (iterator.hasNext()) { - sinkTableRows.add(iterator.next()); - } - } - assertThat(sinkTableRows.size()).isEqualTo(1); - Row sinkTableRow = sinkTableRows.get(0); - assertThat(sinkTableRow.getField("database_name")).isEqualTo("default"); - assertThat(sinkTableRow.getField("table_name")).isEqualTo("T"); - assertThat(sinkTableRow.getField("job_name")).isEqualTo("insert_t_job"); - - tEnv.getConfig().getConfiguration().set(PipelineOptions.NAME, "select_t_job"); - tEnv.executeSql("SELECT * FROM T").collect().close(); - assertThat(jobSourceTableLineages).isNotEmpty(); - TableLineageEntity sourceTableLineage = - jobSourceTableLineages.get("select_t_job").get("default.T.select_t_job"); - assertThat(sourceTableLineage.getTable()).isEqualTo("T"); - - List sourceTableRows = new ArrayList<>(); - try (CloseableIterator iterator = - tEnv.executeSql("SELECT * FROM sys.source_table_lineage").collect()) { - while (iterator.hasNext()) { - sourceTableRows.add(iterator.next()); - } - } - assertThat(sourceTableRows.size()).isEqualTo(1); - Row sourceTableRow = sourceTableRows.get(0); - assertThat(sourceTableRow.getField("database_name")).isEqualTo("default"); - assertThat(sourceTableRow.getField("table_name")).isEqualTo("T"); - assertThat(sourceTableRow.getField("job_name")).isEqualTo("select_t_job"); - } - - private static String getTableLineageKey(TableLineageEntity entity) { - return String.format("%s.%s.%s", entity.getDatabase(), entity.getTable(), entity.getJob()); - } - - /** Factory to create throwing lineage meta. 
*/ - public static class TestingMemoryLineageMetaFactory implements LineageMetaFactory { - private static final long serialVersionUID = 1L; - - @Override - public String identifier() { - return THROWING_META; - } - - @Override - public LineageMeta create(LineageMetaContext context) { - return new TestingMemoryLineageMeta(); - } - } - - /** Throwing specific exception in each method. */ - private static class TestingMemoryLineageMeta implements LineageMeta { - - @Override - public void saveSourceTableLineage(TableLineageEntity entity) { - jobSourceTableLineages - .computeIfAbsent(entity.getJob(), key -> new HashMap<>()) - .put(getTableLineageKey(entity), entity); - } - - @Override - public void deleteSourceTableLineage(String job) { - jobSourceTableLineages.remove(job); - } - - @Override - public Iterator sourceTableLineages(@Nullable Predicate predicate) { - return jobSourceTableLineages.values().stream() - .flatMap(v -> v.values().stream()) - .iterator(); - } - - @Override - public void saveSinkTableLineage(TableLineageEntity entity) { - assertThat(entity.getJob()).isEqualTo("insert_t_job"); - assertThat(entity.getTable()).isEqualTo("T"); - assertThat(entity.getDatabase()).isEqualTo("default"); - jobSinkTableLineages - .computeIfAbsent(entity.getJob(), key -> new HashMap<>()) - .put(getTableLineageKey(entity), entity); - } - - @Override - public Iterator sinkTableLineages(@Nullable Predicate predicate) { - return jobSinkTableLineages.values().stream() - .flatMap(v -> v.values().stream()) - .iterator(); - } - - @Override - public void deleteSinkTableLineage(String job) { - jobSinkTableLineages.remove(job); - } - - @Override - public void saveSourceDataLineage(DataLineageEntity entity) { - assertThat(entity.getJob()).isEqualTo("select_t_job"); - assertThat(entity.getTable()).isEqualTo("T"); - assertThat(entity.getDatabase()).isEqualTo("default"); - throw new UnsupportedOperationException("Method saveSinkTableLineage is not supported"); - } - - @Override - public Iterator sourceDataLineages(@Nullable Predicate predicate) { - throw new UnsupportedOperationException(); - } - - @Override - public void saveSinkDataLineage(DataLineageEntity entity) { - throw new UnsupportedOperationException(); - } - - @Override - public Iterator sinkDataLineages(@Nullable Predicate predicate) { - throw new UnsupportedOperationException(); - } - - @Override - public void close() throws Exception {} - } -} diff --git a/paimon-flink/paimon-flink-common/src/test/resources/META-INF/services/org.apache.paimon.factories.Factory b/paimon-flink/paimon-flink-common/src/test/resources/META-INF/services/org.apache.paimon.factories.Factory index fcb6fe982943f..3c05b5fba3ec9 100644 --- a/paimon-flink/paimon-flink-common/src/test/resources/META-INF/services/org.apache.paimon.factories.Factory +++ b/paimon-flink/paimon-flink-common/src/test/resources/META-INF/services/org.apache.paimon.factories.Factory @@ -15,8 +15,5 @@ org.apache.paimon.flink.FlinkCatalogTest$TestingLogSoreRegisterFactory -# Lineage meta factory -org.apache.paimon.flink.FlinkLineageITCase$TestingMemoryLineageMetaFactory - # Catalog lock factory org.apache.paimon.flink.FileSystemCatalogITCase$FileSystemCatalogDummyLockFactory \ No newline at end of file diff --git a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java index 9a90995f282d2..5157e606006ca 100644 --- 
a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java +++ b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java @@ -610,8 +610,7 @@ public org.apache.paimon.table.Table getDataOrFormatTable(Identifier identifier) lockFactory().orElse(null), lockContext().orElse(null), identifier), - metastoreClientFactory(identifier, tableMeta.schema()).orElse(null), - lineageMetaFactory)); + metastoreClientFactory(identifier, tableMeta.schema()).orElse(null))); } catch (TableNotExistException ignore) { } From 4c6c557e6fd70e9ab9e5ebd4292f80340e5803ed Mon Sep 17 00:00:00 2001 From: yunfengzhou-hub Date: Sun, 1 Dec 2024 19:38:54 +0800 Subject: [PATCH 083/157] [flink] Avoid deprecated SetupableStreamOperator (#4591) --- .../flink/sink/cdc/CdcDynamicBucketSink.java | 8 +- .../cdc/CdcDynamicBucketWriteOperator.java | 35 ++- .../flink/sink/cdc/CdcFixedBucketSink.java | 6 +- .../cdc/CdcRecordStoreMultiWriteOperator.java | 46 +++- .../sink/cdc/CdcRecordStoreWriteOperator.java | 35 ++- .../flink/sink/cdc/CdcUnawareBucketSink.java | 6 +- .../cdc/CdcUnawareBucketWriteOperator.java | 35 ++- .../sink/cdc/FlinkCdcMultiTableSink.java | 17 +- .../cdc/FlinkCdcSyncDatabaseSinkBuilder.java | 4 +- .../CdcRecordStoreMultiWriteOperatorTest.java | 6 +- .../cdc/CdcRecordStoreWriteOperatorTest.java | 6 +- .../sink/cdc/FlinkCdcMultiTableSinkTest.java | 1 - .../AppendBypassCompactWorkerOperator.java | 35 ++- .../sink/AppendCompactWorkerOperator.java | 22 +- ...nlyMultiTableCompactionWorkerOperator.java | 42 +++- ...lySingleTableCompactionWorkerOperator.java | 34 ++- .../AutoTagForSavepointCommitterOperator.java | 24 +-- ...gForSavepointCommitterOperatorFactory.java | 94 ++++++++ .../sink/BatchWriteGeneratorTagOperator.java | 24 +-- ...BatchWriteGeneratorTagOperatorFactory.java | 60 ++++++ .../sink/CombinedTableCompactorSink.java | 14 +- .../paimon/flink/sink/CommitterOperator.java | 26 +-- .../flink/sink/CommitterOperatorFactory.java | 115 ++++++++++ .../paimon/flink/sink/CompactorSink.java | 6 +- .../sink/DynamicBucketRowWriteOperator.java | 34 ++- .../paimon/flink/sink/FixedBucketSink.java | 7 +- .../apache/paimon/flink/sink/FlinkSink.java | 24 ++- .../paimon/flink/sink/FlinkSinkBuilder.java | 2 +- .../paimon/flink/sink/LocalMergeOperator.java | 34 ++- .../sink/MultiTablesStoreCompactOperator.java | 58 ++++- .../flink/sink/PrepareCommitOperator.java | 19 +- .../flink/sink/RewriteFileIndexSink.java | 56 +++-- .../flink/sink/RowDataStoreWriteOperator.java | 53 +++-- .../flink/sink/RowDynamicBucketSink.java | 8 +- .../flink/sink/RowUnawareBucketSink.java | 46 ++-- .../flink/sink/StoreCompactOperator.java | 50 ++++- .../paimon/flink/sink/TableWriteOperator.java | 23 +- .../sink/UnawareBucketCompactionSink.java | 8 +- .../paimon/flink/sink/UnawareBucketSink.java | 5 +- .../sink/index/GlobalDynamicBucketSink.java | 11 +- .../sink/index/IndexBootstrapOperator.java | 39 +++- .../AppendBypassCoordinateOperator.java | 8 +- ...AppendBypassCoordinateOperatorFactory.java | 6 +- ...ultiTableCompactionWorkerOperatorTest.java | 19 +- ...ngleTableCompactionWorkerOperatorTest.java | 28 ++- ...oTagForSavepointCommitterOperatorTest.java | 35 +-- .../BatchWriteGeneratorTagOperatorTest.java | 39 +++- .../flink/sink/CommitterOperatorTest.java | 110 ++++++---- .../flink/sink/CompactorSinkITCase.java | 8 +- .../paimon/flink/sink/FlinkSinkTest.java | 18 +- .../flink/sink/LocalMergeOperatorTest.java | 18 +- .../flink/sink/StoreCompactOperatorTest.java | 8 +- 
.../flink/sink/StoreMultiCommitterTest.java | 15 +- .../sink/WriterChainingStrategyTest.java | 203 ++++++++++++++++++ .../paimon/flink/sink/WriterOperatorTest.java | 45 ++-- 55 files changed, 1397 insertions(+), 341 deletions(-) create mode 100644 paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperatorFactory.java create mode 100644 paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperatorFactory.java create mode 100644 paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperatorFactory.java create mode 100644 paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterChainingStrategyTest.java diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicBucketSink.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicBucketSink.java index 574ff685f3fa4..6d9e3a4a7c82f 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicBucketSink.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicBucketSink.java @@ -25,7 +25,7 @@ import org.apache.paimon.table.sink.KeyAndBucketExtractor; import org.apache.flink.api.java.tuple.Tuple2; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; /** {@link CdcDynamicBucketSinkBase} for {@link CdcRecord}. */ public class CdcDynamicBucketSink extends CdcDynamicBucketSinkBase { @@ -42,8 +42,8 @@ protected KeyAndBucketExtractor createExtractor(TableSchema schema) { } @Override - protected OneInputStreamOperator, Committable> createWriteOperator( - StoreSinkWrite.Provider writeProvider, String commitUser) { - return new CdcDynamicBucketWriteOperator(table, writeProvider, commitUser); + protected OneInputStreamOperatorFactory, Committable> + createWriteOperatorFactory(StoreSinkWrite.Provider writeProvider, String commitUser) { + return new CdcDynamicBucketWriteOperator.Factory(table, writeProvider, commitUser); } } diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicBucketWriteOperator.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicBucketWriteOperator.java index b2fbdc3e93eef..b0b135b3610bb 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicBucketWriteOperator.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcDynamicBucketWriteOperator.java @@ -19,6 +19,7 @@ package org.apache.paimon.flink.sink.cdc; import org.apache.paimon.data.GenericRow; +import org.apache.paimon.flink.sink.Committable; import org.apache.paimon.flink.sink.PrepareCommitOperator; import org.apache.paimon.flink.sink.StoreSinkWrite; import org.apache.paimon.flink.sink.TableWriteOperator; @@ -26,6 +27,9 @@ import org.apache.flink.api.java.tuple.Tuple2; import org.apache.flink.runtime.state.StateInitializationContext; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; import java.io.IOException; @@ -43,11 +47,12 @@ public class CdcDynamicBucketWriteOperator extends 
TableWriteOperator parameters, FileStoreTable table, StoreSinkWrite.Provider storeSinkWriteProvider, String initialCommitUser) { - super(table, storeSinkWriteProvider, initialCommitUser); + super(parameters, table, storeSinkWriteProvider, initialCommitUser); this.retrySleepMillis = table.coreOptions().toConfiguration().get(RETRY_SLEEP_TIME).toMillis(); } @@ -85,4 +90,30 @@ public void processElement(StreamRecord> element) thr throw new IOException(e); } } + + /** {@link StreamOperatorFactory} of {@link CdcDynamicBucketWriteOperator}. */ + public static class Factory extends TableWriteOperator.Factory> { + + public Factory( + FileStoreTable table, + StoreSinkWrite.Provider storeSinkWriteProvider, + String initialCommitUser) { + super(table, storeSinkWriteProvider, initialCommitUser); + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new CdcDynamicBucketWriteOperator( + parameters, table, storeSinkWriteProvider, initialCommitUser); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return CdcDynamicBucketWriteOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcFixedBucketSink.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcFixedBucketSink.java index 59bdb192beea7..bec9508888b4c 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcFixedBucketSink.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcFixedBucketSink.java @@ -24,7 +24,7 @@ import org.apache.paimon.flink.sink.StoreSinkWrite; import org.apache.paimon.table.FileStoreTable; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; /** * A {@link FlinkSink} for fixed-bucket table which accepts {@link CdcRecord} and waits for a schema @@ -39,8 +39,8 @@ public CdcFixedBucketSink(FileStoreTable table) { } @Override - protected OneInputStreamOperator createWriteOperator( + protected OneInputStreamOperatorFactory createWriteOperatorFactory( StoreSinkWrite.Provider writeProvider, String commitUser) { - return new CdcRecordStoreWriteOperator(table, writeProvider, commitUser); + return new CdcRecordStoreWriteOperator.Factory(table, writeProvider, commitUser); } } diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreMultiWriteOperator.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreMultiWriteOperator.java index 7d72fe3e801f9..5db111a300474 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreMultiWriteOperator.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreMultiWriteOperator.java @@ -38,6 +38,9 @@ import org.apache.flink.runtime.state.StateInitializationContext; import org.apache.flink.runtime.state.StateSnapshotContext; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; import java.io.IOException; @@ -74,12 +77,13 @@ public class CdcRecordStoreMultiWriteOperator private String 
commitUser; private ExecutorService compactExecutor; - public CdcRecordStoreMultiWriteOperator( + private CdcRecordStoreMultiWriteOperator( + StreamOperatorParameters parameters, Catalog.Loader catalogLoader, StoreSinkWrite.WithWriteBufferProvider storeSinkWriteProvider, String initialCommitUser, Options options) { - super(options); + super(parameters, options); this.catalogLoader = catalogLoader; this.storeSinkWriteProvider = storeSinkWriteProvider; this.initialCommitUser = initialCommitUser; @@ -254,4 +258,42 @@ public Map writes() { public String commitUser() { return commitUser; } + + /** {@link StreamOperatorFactory} of {@link CdcRecordStoreMultiWriteOperator}. */ + public static class Factory + extends PrepareCommitOperator.Factory { + private final StoreSinkWrite.WithWriteBufferProvider storeSinkWriteProvider; + private final String initialCommitUser; + private final Catalog.Loader catalogLoader; + + public Factory( + Catalog.Loader catalogLoader, + StoreSinkWrite.WithWriteBufferProvider storeSinkWriteProvider, + String initialCommitUser, + Options options) { + super(options); + this.catalogLoader = catalogLoader; + this.storeSinkWriteProvider = storeSinkWriteProvider; + this.initialCommitUser = initialCommitUser; + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new CdcRecordStoreMultiWriteOperator( + parameters, + catalogLoader, + storeSinkWriteProvider, + initialCommitUser, + options); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return CdcRecordStoreMultiWriteOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreWriteOperator.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreWriteOperator.java index dd0aa2e5622c2..195e683daaf6f 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreWriteOperator.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreWriteOperator.java @@ -19,6 +19,7 @@ package org.apache.paimon.flink.sink.cdc; import org.apache.paimon.data.GenericRow; +import org.apache.paimon.flink.sink.Committable; import org.apache.paimon.flink.sink.PrepareCommitOperator; import org.apache.paimon.flink.sink.StoreSinkWrite; import org.apache.paimon.flink.sink.TableWriteOperator; @@ -27,6 +28,9 @@ import org.apache.paimon.table.FileStoreTable; import org.apache.flink.runtime.state.StateInitializationContext; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; import java.io.IOException; @@ -50,11 +54,12 @@ public class CdcRecordStoreWriteOperator extends TableWriteOperator { private final long retrySleepMillis; - public CdcRecordStoreWriteOperator( + protected CdcRecordStoreWriteOperator( + StreamOperatorParameters parameters, FileStoreTable table, StoreSinkWrite.Provider storeSinkWriteProvider, String initialCommitUser) { - super(table, storeSinkWriteProvider, initialCommitUser); + super(parameters, table, storeSinkWriteProvider, initialCommitUser); this.retrySleepMillis = table.coreOptions().toConfiguration().get(RETRY_SLEEP_TIME).toMillis(); } @@ -92,4 +97,30 @@ public void 
processElement(StreamRecord element) throws Exception { throw new IOException(e); } } + + /** {@link StreamOperatorFactory} of {@link CdcRecordStoreWriteOperator}. */ + public static class Factory extends TableWriteOperator.Factory { + + public Factory( + FileStoreTable table, + StoreSinkWrite.Provider storeSinkWriteProvider, + String initialCommitUser) { + super(table, storeSinkWriteProvider, initialCommitUser); + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new CdcRecordStoreWriteOperator( + parameters, table, storeSinkWriteProvider, initialCommitUser); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return CdcRecordStoreWriteOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcUnawareBucketSink.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcUnawareBucketSink.java index 313f4d013ef89..820ef7728f8ce 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcUnawareBucketSink.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcUnawareBucketSink.java @@ -24,7 +24,7 @@ import org.apache.paimon.table.FileStoreTable; import org.apache.flink.streaming.api.datastream.DataStream; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import javax.annotation.Nullable; @@ -42,9 +42,9 @@ public CdcUnawareBucketSink(FileStoreTable table, Integer parallelism) { } @Override - protected OneInputStreamOperator createWriteOperator( + protected OneInputStreamOperatorFactory createWriteOperatorFactory( StoreSinkWrite.Provider writeProvider, String commitUser) { - return new CdcUnawareBucketWriteOperator(table, writeProvider, commitUser); + return new CdcUnawareBucketWriteOperator.Factory(table, writeProvider, commitUser); } @Override diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcUnawareBucketWriteOperator.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcUnawareBucketWriteOperator.java index c57a40f3f71da..26f65fdd09ce2 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcUnawareBucketWriteOperator.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/CdcUnawareBucketWriteOperator.java @@ -18,21 +18,26 @@ package org.apache.paimon.flink.sink.cdc; +import org.apache.paimon.flink.sink.Committable; import org.apache.paimon.flink.sink.PrepareCommitOperator; import org.apache.paimon.flink.sink.StoreSinkWrite; import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.types.RowKind; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; /** A {@link PrepareCommitOperator} to write {@link CdcRecord} to unaware-bucket mode table. 
*/ public class CdcUnawareBucketWriteOperator extends CdcRecordStoreWriteOperator { - public CdcUnawareBucketWriteOperator( + private CdcUnawareBucketWriteOperator( + StreamOperatorParameters parameters, FileStoreTable table, StoreSinkWrite.Provider storeSinkWriteProvider, String initialCommitUser) { - super(table, storeSinkWriteProvider, initialCommitUser); + super(parameters, table, storeSinkWriteProvider, initialCommitUser); } @Override @@ -42,4 +47,30 @@ public void processElement(StreamRecord element) throws Exception { super.processElement(element); } } + + /** {@link StreamOperatorFactory} of {@link CdcUnawareBucketWriteOperator}. */ + public static class Factory extends CdcRecordStoreWriteOperator.Factory { + + public Factory( + FileStoreTable table, + StoreSinkWrite.Provider storeSinkWriteProvider, + String initialCommitUser) { + super(table, storeSinkWriteProvider, initialCommitUser); + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new CdcUnawareBucketWriteOperator( + parameters, table, storeSinkWriteProvider, initialCommitUser); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return CdcUnawareBucketWriteOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSink.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSink.java index 55e987c6055fa..f9b7bbc6b9105 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSink.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSink.java @@ -21,7 +21,7 @@ import org.apache.paimon.catalog.Catalog; import org.apache.paimon.flink.sink.CommittableStateManager; import org.apache.paimon.flink.sink.Committer; -import org.apache.paimon.flink.sink.CommitterOperator; +import org.apache.paimon.flink.sink.CommitterOperatorFactory; import org.apache.paimon.flink.sink.FlinkSink; import org.apache.paimon.flink.sink.FlinkStreamPartitioner; import org.apache.paimon.flink.sink.MultiTableCommittable; @@ -41,7 +41,7 @@ import org.apache.flink.streaming.api.datastream.SingleOutputStreamOperator; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; import org.apache.flink.streaming.api.functions.sink.DiscardingSink; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import javax.annotation.Nullable; @@ -63,19 +63,16 @@ public class FlinkCdcMultiTableSink implements Serializable { private final Catalog.Loader catalogLoader; private final double commitCpuCores; @Nullable private final MemorySize commitHeapMemory; - private final boolean commitChaining; private final String commitUser; public FlinkCdcMultiTableSink( Catalog.Loader catalogLoader, double commitCpuCores, @Nullable MemorySize commitHeapMemory, - boolean commitChaining, String commitUser) { this.catalogLoader = catalogLoader; this.commitCpuCores = commitCpuCores; this.commitHeapMemory = commitHeapMemory; - this.commitChaining = commitChaining; this.commitUser = commitUser; } @@ -129,10 +126,9 @@ public DataStreamSink sinkFrom( .transform( GLOBAL_COMMITTER_NAME, typeInfo, - new CommitterOperator<>( + new CommitterOperatorFactory<>( true, false, - commitChaining, commitUser, 
createCommitterFactory(), createCommittableStateManager())) @@ -141,9 +137,10 @@ public DataStreamSink sinkFrom( return committed.addSink(new DiscardingSink<>()).name("end").setParallelism(1); } - protected OneInputStreamOperator createWriteOperator( - StoreSinkWrite.WithWriteBufferProvider writeProvider, String commitUser) { - return new CdcRecordStoreMultiWriteOperator( + protected OneInputStreamOperatorFactory + createWriteOperator( + StoreSinkWrite.WithWriteBufferProvider writeProvider, String commitUser) { + return new CdcRecordStoreMultiWriteOperator.Factory( catalogLoader, writeProvider, commitUser, new Options()); } diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcSyncDatabaseSinkBuilder.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcSyncDatabaseSinkBuilder.java index ed8fdd113389a..a9ad66847b4b5 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcSyncDatabaseSinkBuilder.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcSyncDatabaseSinkBuilder.java @@ -66,7 +66,6 @@ public class FlinkCdcSyncDatabaseSinkBuilder { @Nullable private Integer parallelism; private double committerCpu; @Nullable private MemorySize committerMemory; - private boolean commitChaining; // Paimon catalog used to check and create tables. There will be two // places where this catalog is used. 1) in processing function, @@ -103,7 +102,6 @@ public FlinkCdcSyncDatabaseSinkBuilder withTableOptions(Options options) { this.parallelism = options.get(FlinkConnectorOptions.SINK_PARALLELISM); this.committerCpu = options.get(FlinkConnectorOptions.SINK_COMMITTER_CPU); this.committerMemory = options.get(FlinkConnectorOptions.SINK_COMMITTER_MEMORY); - this.commitChaining = options.get(FlinkConnectorOptions.SINK_COMMITTER_OPERATOR_CHAINING); this.commitUser = createCommitUser(options); return this; } @@ -169,7 +167,7 @@ private void buildCombinedCdcSink() { FlinkCdcMultiTableSink sink = new FlinkCdcMultiTableSink( - catalogLoader, committerCpu, committerMemory, commitChaining, commitUser); + catalogLoader, committerCpu, committerMemory, commitUser); sink.sinkFrom(partitioned); } diff --git a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreMultiWriteOperatorTest.java b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreMultiWriteOperatorTest.java index 8c78ab853a60a..9f35b25026bbb 100644 --- a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreMultiWriteOperatorTest.java +++ b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreMultiWriteOperatorTest.java @@ -689,8 +689,8 @@ public void testUsingTheSameCompactExecutor() throws Exception { private OneInputStreamOperatorTestHarness createTestHarness(Catalog.Loader catalogLoader) throws Exception { - CdcRecordStoreMultiWriteOperator operator = - new CdcRecordStoreMultiWriteOperator( + CdcRecordStoreMultiWriteOperator.Factory operatorFactory = + new CdcRecordStoreMultiWriteOperator.Factory( catalogLoader, (t, commitUser, state, ioManager, memoryPoolFactory, metricGroup) -> new StoreSinkWriteImpl( @@ -709,7 +709,7 @@ public void testUsingTheSameCompactExecutor() throws Exception { TypeSerializer outputSerializer = new MultiTableCommittableTypeInfo().createSerializer(new ExecutionConfig()); OneInputStreamOperatorTestHarness harness = - new 
OneInputStreamOperatorTestHarness<>(operator, inputSerializer); + new OneInputStreamOperatorTestHarness<>(operatorFactory, inputSerializer); harness.setup(outputSerializer); return harness; } diff --git a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreWriteOperatorTest.java b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreWriteOperatorTest.java index f3693fe405ded..f00229d99890e 100644 --- a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreWriteOperatorTest.java +++ b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/CdcRecordStoreWriteOperatorTest.java @@ -253,8 +253,8 @@ public void testUpdateColumnType() throws Exception { private OneInputStreamOperatorTestHarness createTestHarness( FileStoreTable table) throws Exception { - CdcRecordStoreWriteOperator operator = - new CdcRecordStoreWriteOperator( + CdcRecordStoreWriteOperator.Factory operatorFactory = + new CdcRecordStoreWriteOperator.Factory( table, (t, commitUser, state, ioManager, memoryPool, metricGroup) -> new StoreSinkWriteImpl( @@ -272,7 +272,7 @@ private OneInputStreamOperatorTestHarness createTestHarn TypeSerializer outputSerializer = new CommittableTypeInfo().createSerializer(new ExecutionConfig()); OneInputStreamOperatorTestHarness harness = - new OneInputStreamOperatorTestHarness<>(operator, inputSerializer); + new OneInputStreamOperatorTestHarness<>(operatorFactory, inputSerializer); harness.setup(outputSerializer); return harness; } diff --git a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSinkTest.java b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSinkTest.java index fd23e500d5e55..e1bd112ca751e 100644 --- a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSinkTest.java +++ b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSinkTest.java @@ -60,7 +60,6 @@ public void cancel() {} () -> FlinkCatalogFactory.createPaimonCatalog(new Options()), FlinkConnectorOptions.SINK_COMMITTER_CPU.defaultValue(), null, - true, UUID.randomUUID().toString()); DataStreamSink dataStreamSink = sink.sinkFrom(input); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendBypassCompactWorkerOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendBypassCompactWorkerOperator.java index 92cd31ea8aa26..977511920a061 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendBypassCompactWorkerOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendBypassCompactWorkerOperator.java @@ -21,7 +21,9 @@ import org.apache.paimon.append.UnawareAppendCompactionTask; import org.apache.paimon.table.FileStoreTable; -import org.apache.flink.streaming.api.operators.ChainingStrategy; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; import org.apache.flink.types.Either; @@ -29,9 +31,11 @@ public class AppendBypassCompactWorkerOperator extends AppendCompactWorkerOperator> { - public AppendBypassCompactWorkerOperator(FileStoreTable 
table, String commitUser) { - super(table, commitUser); - this.chainingStrategy = ChainingStrategy.HEAD; + private AppendBypassCompactWorkerOperator( + StreamOperatorParameters parameters, + FileStoreTable table, + String commitUser) { + super(parameters, table, commitUser); } @Override @@ -49,4 +53,27 @@ public void processElement( unawareBucketCompactor.processElement(element.getValue().right()); } } + + /** {@link StreamOperatorFactory} of {@link AppendBypassCompactWorkerOperator}. */ + public static class Factory + extends AppendCompactWorkerOperator.Factory< + Either> { + + public Factory(FileStoreTable table, String initialCommitUser) { + super(table, initialCommitUser); + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) new AppendBypassCompactWorkerOperator(parameters, table, commitUser); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return AppendBypassCompactWorkerOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendCompactWorkerOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendCompactWorkerOperator.java index 52ab75de6b2c3..7a3c0231eb65d 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendCompactWorkerOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendCompactWorkerOperator.java @@ -27,6 +27,8 @@ import org.apache.paimon.table.sink.CommitMessage; import org.apache.paimon.utils.ExecutorThreadFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.slf4j.Logger; import org.slf4j.LoggerFactory; @@ -53,8 +55,11 @@ public abstract class AppendCompactWorkerOperator private transient ExecutorService lazyCompactExecutor; - public AppendCompactWorkerOperator(FileStoreTable table, String commitUser) { - super(Options.fromMap(table.options())); + public AppendCompactWorkerOperator( + StreamOperatorParameters parameters, + FileStoreTable table, + String commitUser) { + super(parameters, Options.fromMap(table.options())); this.table = table; this.commitUser = commitUser; } @@ -101,4 +106,17 @@ public void close() throws Exception { this.unawareBucketCompactor.close(); } } + + /** {@link StreamOperatorFactory} of {@link AppendCompactWorkerOperator}. 
*/ + protected abstract static class Factory + extends PrepareCommitOperator.Factory { + protected final FileStoreTable table; + protected final String commitUser; + + protected Factory(FileStoreTable table, String commitUser) { + super(Options.fromMap(table.options())); + this.table = table; + this.commitUser = commitUser; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendOnlyMultiTableCompactionWorkerOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendOnlyMultiTableCompactionWorkerOperator.java index 15e7b9746fe6c..83d51f302e51f 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendOnlyMultiTableCompactionWorkerOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendOnlyMultiTableCompactionWorkerOperator.java @@ -28,6 +28,9 @@ import org.apache.paimon.utils.ExceptionUtils; import org.apache.paimon.utils.ExecutorThreadFactory; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; import org.slf4j.Logger; import org.slf4j.LoggerFactory; @@ -62,9 +65,12 @@ public class AppendOnlyMultiTableCompactionWorkerOperator private transient Catalog catalog; - public AppendOnlyMultiTableCompactionWorkerOperator( - Catalog.Loader catalogLoader, String commitUser, Options options) { - super(options); + private AppendOnlyMultiTableCompactionWorkerOperator( + StreamOperatorParameters parameters, + Catalog.Loader catalogLoader, + String commitUser, + Options options) { + super(parameters, options); this.commitUser = commitUser; this.catalogLoader = catalogLoader; } @@ -175,4 +181,34 @@ public void close() throws Exception { ExceptionUtils.throwMultiException(exceptions); } + + /** {@link StreamOperatorFactory} of {@link AppendOnlyMultiTableCompactionWorkerOperator}. 
*/ + public static class Factory + extends PrepareCommitOperator.Factory< + MultiTableUnawareAppendCompactionTask, MultiTableCommittable> { + + private final String commitUser; + private final Catalog.Loader catalogLoader; + + public Factory(Catalog.Loader catalogLoader, String commitUser, Options options) { + super(options); + this.commitUser = commitUser; + this.catalogLoader = catalogLoader; + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new AppendOnlyMultiTableCompactionWorkerOperator( + parameters, catalogLoader, commitUser, options); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return AppendOnlyMultiTableCompactionWorkerOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendOnlySingleTableCompactionWorkerOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendOnlySingleTableCompactionWorkerOperator.java index 4d0201d324615..917a7f64f1a04 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendOnlySingleTableCompactionWorkerOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AppendOnlySingleTableCompactionWorkerOperator.java @@ -22,6 +22,9 @@ import org.apache.paimon.flink.source.BucketUnawareCompactSource; import org.apache.paimon.table.FileStoreTable; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; /** @@ -31,12 +34,39 @@ public class AppendOnlySingleTableCompactionWorkerOperator extends AppendCompactWorkerOperator { - public AppendOnlySingleTableCompactionWorkerOperator(FileStoreTable table, String commitUser) { - super(table, commitUser); + private AppendOnlySingleTableCompactionWorkerOperator( + StreamOperatorParameters parameters, + FileStoreTable table, + String commitUser) { + super(parameters, table, commitUser); } @Override public void processElement(StreamRecord element) throws Exception { this.unawareBucketCompactor.processElement(element.getValue()); } + + /** {@link StreamOperatorFactory} of {@link AppendOnlySingleTableCompactionWorkerOperator}. 
*/ + public static class Factory + extends AppendCompactWorkerOperator.Factory { + + public Factory(FileStoreTable table, String initialCommitUser) { + super(table, initialCommitUser); + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new AppendOnlySingleTableCompactionWorkerOperator( + parameters, table, commitUser); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return AppendOnlySingleTableCompactionWorkerOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperator.java index 6d27c60194837..0822f04612413 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperator.java @@ -32,18 +32,13 @@ import org.apache.flink.runtime.checkpoint.CheckpointOptions; import org.apache.flink.runtime.jobgraph.OperatorID; import org.apache.flink.runtime.state.CheckpointStreamFactory; -import org.apache.flink.streaming.api.graph.StreamConfig; import org.apache.flink.streaming.api.operators.BoundedOneInput; -import org.apache.flink.streaming.api.operators.ChainingStrategy; import org.apache.flink.streaming.api.operators.OneInputStreamOperator; import org.apache.flink.streaming.api.operators.OperatorSnapshotFutures; -import org.apache.flink.streaming.api.operators.Output; -import org.apache.flink.streaming.api.operators.SetupableStreamOperator; import org.apache.flink.streaming.api.operators.StreamTaskStateInitializer; import org.apache.flink.streaming.api.watermark.Watermark; import org.apache.flink.streaming.runtime.streamrecord.LatencyMarker; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; -import org.apache.flink.streaming.runtime.tasks.StreamTask; import org.apache.flink.streaming.runtime.watermarkstatus.WatermarkStatus; import java.time.Duration; @@ -58,9 +53,7 @@ * time, tags are automatically created for each flink savepoint. 
*/ public class AutoTagForSavepointCommitterOperator - implements OneInputStreamOperator, - SetupableStreamOperator, - BoundedOneInput { + implements OneInputStreamOperator, BoundedOneInput { public static final String SAVEPOINT_TAG_PREFIX = "savepoint-"; private static final long serialVersionUID = 1L; @@ -256,19 +249,4 @@ public void setKeyContextElement(StreamRecord record) throws Exception public void endInput() throws Exception { commitOperator.endInput(); } - - @Override - public void setup(StreamTask containingTask, StreamConfig config, Output output) { - commitOperator.setup(containingTask, config, output); - } - - @Override - public ChainingStrategy getChainingStrategy() { - return commitOperator.getChainingStrategy(); - } - - @Override - public void setChainingStrategy(ChainingStrategy strategy) { - commitOperator.setChainingStrategy(strategy); - } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperatorFactory.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperatorFactory.java new file mode 100644 index 0000000000000..1787f8e7adce5 --- /dev/null +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperatorFactory.java @@ -0,0 +1,94 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink.sink; + +import org.apache.paimon.operation.TagDeletion; +import org.apache.paimon.table.sink.TagCallback; +import org.apache.paimon.utils.SerializableSupplier; +import org.apache.paimon.utils.SnapshotManager; +import org.apache.paimon.utils.TagManager; + +import org.apache.flink.streaming.api.operators.AbstractStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; + +import java.time.Duration; +import java.util.List; +import java.util.NavigableSet; +import java.util.TreeSet; + +/** + * {@link org.apache.flink.streaming.api.operators.StreamOperatorFactory} for {@link + * AutoTagForSavepointCommitterOperator}. 
+ */ +public class AutoTagForSavepointCommitterOperatorFactory + extends AbstractStreamOperatorFactory + implements OneInputStreamOperatorFactory { + + private final CommitterOperatorFactory commitOperatorFactory; + + private final SerializableSupplier snapshotManagerFactory; + + private final SerializableSupplier tagManagerFactory; + + private final SerializableSupplier tagDeletionFactory; + + private final SerializableSupplier> callbacksSupplier; + + private final NavigableSet identifiersForTags; + + private final Duration tagTimeRetained; + + public AutoTagForSavepointCommitterOperatorFactory( + CommitterOperatorFactory commitOperatorFactory, + SerializableSupplier snapshotManagerFactory, + SerializableSupplier tagManagerFactory, + SerializableSupplier tagDeletionFactory, + SerializableSupplier> callbacksSupplier, + Duration tagTimeRetained) { + this.commitOperatorFactory = commitOperatorFactory; + this.tagManagerFactory = tagManagerFactory; + this.snapshotManagerFactory = snapshotManagerFactory; + this.tagDeletionFactory = tagDeletionFactory; + this.callbacksSupplier = callbacksSupplier; + this.identifiersForTags = new TreeSet<>(); + this.tagTimeRetained = tagTimeRetained; + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new AutoTagForSavepointCommitterOperator<>( + commitOperatorFactory.createStreamOperator(parameters), + snapshotManagerFactory, + tagManagerFactory, + tagDeletionFactory, + callbacksSupplier, + tagTimeRetained); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return AutoTagForSavepointCommitterOperator.class; + } +} diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperator.java index 23202b45077ff..1cbcc4b2262fd 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperator.java @@ -28,18 +28,13 @@ import org.apache.flink.runtime.checkpoint.CheckpointOptions; import org.apache.flink.runtime.jobgraph.OperatorID; import org.apache.flink.runtime.state.CheckpointStreamFactory; -import org.apache.flink.streaming.api.graph.StreamConfig; import org.apache.flink.streaming.api.operators.BoundedOneInput; -import org.apache.flink.streaming.api.operators.ChainingStrategy; import org.apache.flink.streaming.api.operators.OneInputStreamOperator; import org.apache.flink.streaming.api.operators.OperatorSnapshotFutures; -import org.apache.flink.streaming.api.operators.Output; -import org.apache.flink.streaming.api.operators.SetupableStreamOperator; import org.apache.flink.streaming.api.operators.StreamTaskStateInitializer; import org.apache.flink.streaming.api.watermark.Watermark; import org.apache.flink.streaming.runtime.streamrecord.LatencyMarker; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; -import org.apache.flink.streaming.runtime.tasks.StreamTask; import org.apache.flink.streaming.runtime.watermarkstatus.WatermarkStatus; import java.time.Instant; @@ -53,9 +48,7 @@ * completed, the corresponding tag is generated. 
*/ public class BatchWriteGeneratorTagOperator - implements OneInputStreamOperator, - SetupableStreamOperator, - BoundedOneInput { + implements OneInputStreamOperator, BoundedOneInput { private static final String BATCH_WRITE_TAG_PREFIX = "batch-write-"; @@ -250,19 +243,4 @@ public void setKeyContextElement(StreamRecord record) throws Exception public void endInput() throws Exception { commitOperator.endInput(); } - - @Override - public void setup(StreamTask containingTask, StreamConfig config, Output output) { - commitOperator.setup(containingTask, config, output); - } - - @Override - public ChainingStrategy getChainingStrategy() { - return commitOperator.getChainingStrategy(); - } - - @Override - public void setChainingStrategy(ChainingStrategy strategy) { - commitOperator.setChainingStrategy(strategy); - } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperatorFactory.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperatorFactory.java new file mode 100644 index 0000000000000..e3c0e5c491680 --- /dev/null +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperatorFactory.java @@ -0,0 +1,60 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink.sink; + +import org.apache.paimon.table.FileStoreTable; + +import org.apache.flink.streaming.api.operators.AbstractStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; + +/** + * {@link org.apache.flink.streaming.api.operators.StreamOperatorFactory} for {@link + * BatchWriteGeneratorTagOperator}. 
+ */ +public class BatchWriteGeneratorTagOperatorFactory + extends AbstractStreamOperatorFactory + implements OneInputStreamOperatorFactory { + private final CommitterOperatorFactory commitOperatorFactory; + + protected final FileStoreTable table; + + public BatchWriteGeneratorTagOperatorFactory( + CommitterOperatorFactory commitOperatorFactory, + FileStoreTable table) { + this.table = table; + this.commitOperatorFactory = commitOperatorFactory; + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new BatchWriteGeneratorTagOperator<>( + commitOperatorFactory.createStreamOperator(parameters), table); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return BatchWriteGeneratorTagOperator.class; + } +} diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java index ce4e37305909a..c2b4cc0f87e60 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java @@ -33,7 +33,7 @@ import org.apache.flink.streaming.api.environment.CheckpointConfig; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; import org.apache.flink.streaming.api.functions.sink.DiscardingSink; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import org.apache.flink.table.data.RowData; import java.io.Serializable; @@ -119,7 +119,7 @@ public DataStream doWrite( .transform( String.format("%s-%s", "Unaware-Bucket-Table", WRITER_NAME), new MultiTableCommittableTypeInfo(), - new AppendOnlyMultiTableCompactionWorkerOperator( + new AppendOnlyMultiTableCompactionWorkerOperator.Factory( catalogLoader, commitUser, options)) .setParallelism(unawareBucketTableSource.getParallelism()); @@ -160,26 +160,28 @@ protected DataStreamSink doCommit( .transform( GLOBAL_COMMITTER_NAME, new MultiTableCommittableTypeInfo(), - new CommitterOperator<>( + new CommitterOperatorFactory<>( streamingCheckpointEnabled, false, - options.get(SINK_COMMITTER_OPERATOR_CHAINING), commitUser, createCommitterFactory(isStreaming), createCommittableStateManager(), options.get(END_INPUT_WATERMARK))) .setParallelism(written.getParallelism()); + if (!options.get(SINK_COMMITTER_OPERATOR_CHAINING)) { + committed = committed.startNewChain(); + } return committed.addSink(new DiscardingSink<>()).name("end").setParallelism(1); } // TODO:refactor FlinkSink to adopt this sink - protected OneInputStreamOperator + protected OneInputStreamOperatorFactory combinedMultiComacptionWriteOperator( CheckpointConfig checkpointConfig, boolean isStreaming, boolean fullCompaction, String commitUser) { - return new MultiTablesStoreCompactOperator( + return new MultiTablesStoreCompactOperator.Factory( catalogLoader, commitUser, checkpointConfig, diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperator.java index 021a5db413d54..383cbcd6ebf71 100644 --- 
a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperator.java @@ -25,8 +25,8 @@ import org.apache.flink.runtime.state.StateSnapshotContext; import org.apache.flink.streaming.api.operators.AbstractStreamOperator; import org.apache.flink.streaming.api.operators.BoundedOneInput; -import org.apache.flink.streaming.api.operators.ChainingStrategy; import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.api.watermark.Watermark; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; @@ -91,26 +91,9 @@ public class CommitterOperator extends AbstractStreamOpe private final Long endInputWatermark; public CommitterOperator( + StreamOperatorParameters parameters, boolean streamingCheckpointEnabled, boolean forceSingleParallelism, - boolean chaining, - String initialCommitUser, - Committer.Factory committerFactory, - CommittableStateManager committableStateManager) { - this( - streamingCheckpointEnabled, - forceSingleParallelism, - chaining, - initialCommitUser, - committerFactory, - committableStateManager, - null); - } - - public CommitterOperator( - boolean streamingCheckpointEnabled, - boolean forceSingleParallelism, - boolean chaining, String initialCommitUser, Committer.Factory committerFactory, CommittableStateManager committableStateManager, @@ -122,7 +105,10 @@ public CommitterOperator( this.committerFactory = checkNotNull(committerFactory); this.committableStateManager = committableStateManager; this.endInputWatermark = endInputWatermark; - setChainingStrategy(chaining ? ChainingStrategy.ALWAYS : ChainingStrategy.HEAD); + this.setup( + parameters.getContainingTask(), + parameters.getStreamConfig(), + parameters.getOutput()); } @Override diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperatorFactory.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperatorFactory.java new file mode 100644 index 0000000000000..cce3d4e176bf8 --- /dev/null +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CommitterOperatorFactory.java @@ -0,0 +1,115 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.flink.sink; + +import org.apache.flink.streaming.api.operators.AbstractStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; + +import java.util.NavigableMap; +import java.util.TreeMap; + +import static org.apache.paimon.utils.Preconditions.checkNotNull; + +/** + * {@link org.apache.flink.streaming.api.operators.StreamOperatorFactory} for {@link + * CommitterOperator}. + */ +public class CommitterOperatorFactory + extends AbstractStreamOperatorFactory + implements OneInputStreamOperatorFactory { + protected final boolean streamingCheckpointEnabled; + + /** Whether to check the parallelism while runtime. */ + protected final boolean forceSingleParallelism; + /** + * This commitUser is valid only for new jobs. After the job starts, this commitUser will be + * recorded into the states of write and commit operators. When the job restarts, commitUser + * will be recovered from states and this value is ignored. + */ + protected final String initialCommitUser; + + /** Group the committable by the checkpoint id. */ + protected final NavigableMap committablesPerCheckpoint; + + protected final Committer.Factory committerFactory; + + protected final CommittableStateManager committableStateManager; + + /** + * Aggregate committables to global committables and commit the global committables to the + * external system. + */ + protected Committer committer; + + protected final Long endInputWatermark; + + public CommitterOperatorFactory( + boolean streamingCheckpointEnabled, + boolean forceSingleParallelism, + String initialCommitUser, + Committer.Factory committerFactory, + CommittableStateManager committableStateManager) { + this( + streamingCheckpointEnabled, + forceSingleParallelism, + initialCommitUser, + committerFactory, + committableStateManager, + null); + } + + public CommitterOperatorFactory( + boolean streamingCheckpointEnabled, + boolean forceSingleParallelism, + String initialCommitUser, + Committer.Factory committerFactory, + CommittableStateManager committableStateManager, + Long endInputWatermark) { + this.streamingCheckpointEnabled = streamingCheckpointEnabled; + this.forceSingleParallelism = forceSingleParallelism; + this.initialCommitUser = initialCommitUser; + this.committablesPerCheckpoint = new TreeMap<>(); + this.committerFactory = checkNotNull(committerFactory); + this.committableStateManager = committableStateManager; + this.endInputWatermark = endInputWatermark; + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new CommitterOperator<>( + parameters, + streamingCheckpointEnabled, + forceSingleParallelism, + initialCommitUser, + committerFactory, + committableStateManager, + endInputWatermark); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return CommitterOperator.class; + } +} diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactorSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactorSink.java index a0c830d73f582..a9c6031dfa346 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactorSink.java +++ 
b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CompactorSink.java @@ -21,7 +21,7 @@ import org.apache.paimon.manifest.ManifestCommittable; import org.apache.paimon.table.FileStoreTable; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import org.apache.flink.table.data.RowData; /** {@link FlinkSink} for dedicated compact jobs. */ @@ -37,9 +37,9 @@ public CompactorSink(FileStoreTable table, boolean fullCompaction) { } @Override - protected OneInputStreamOperator createWriteOperator( + protected OneInputStreamOperatorFactory createWriteOperatorFactory( StoreSinkWrite.Provider writeProvider, String commitUser) { - return new StoreCompactOperator(table, writeProvider, commitUser, fullCompaction); + return new StoreCompactOperator.Factory(table, writeProvider, commitUser, fullCompaction); } @Override diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/DynamicBucketRowWriteOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/DynamicBucketRowWriteOperator.java index 53b9be457c3d8..b31a1af05224f 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/DynamicBucketRowWriteOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/DynamicBucketRowWriteOperator.java @@ -22,6 +22,9 @@ import org.apache.paimon.table.FileStoreTable; import org.apache.flink.api.java.tuple.Tuple2; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; /** @@ -32,11 +35,12 @@ public class DynamicBucketRowWriteOperator private static final long serialVersionUID = 1L; - public DynamicBucketRowWriteOperator( + private DynamicBucketRowWriteOperator( + StreamOperatorParameters parameters, FileStoreTable table, StoreSinkWrite.Provider storeSinkWriteProvider, String initialCommitUser) { - super(table, storeSinkWriteProvider, initialCommitUser); + super(parameters, table, storeSinkWriteProvider, initialCommitUser); } @Override @@ -49,4 +53,30 @@ public void processElement(StreamRecord> element) throws Exception { write.write(element.getValue().f0, element.getValue().f1); } + + /** {@link StreamOperatorFactory} of {@link DynamicBucketRowWriteOperator}. 
*/ + public static class Factory extends TableWriteOperator.Factory> { + + public Factory( + FileStoreTable table, + StoreSinkWrite.Provider storeSinkWriteProvider, + String initialCommitUser) { + super(table, storeSinkWriteProvider, initialCommitUser); + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new DynamicBucketRowWriteOperator( + parameters, table, storeSinkWriteProvider, initialCommitUser); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return DynamicBucketRowWriteOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FixedBucketSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FixedBucketSink.java index 613bf369b0524..402abb4d5aac0 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FixedBucketSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FixedBucketSink.java @@ -21,7 +21,7 @@ import org.apache.paimon.data.InternalRow; import org.apache.paimon.table.FileStoreTable; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import javax.annotation.Nullable; @@ -43,8 +43,9 @@ public FixedBucketSink( } @Override - protected OneInputStreamOperator createWriteOperator( + protected OneInputStreamOperatorFactory createWriteOperatorFactory( StoreSinkWrite.Provider writeProvider, String commitUser) { - return new RowDataStoreWriteOperator(table, logSinkFunction, writeProvider, commitUser); + return new RowDataStoreWriteOperator.Factory( + table, logSinkFunction, writeProvider, commitUser); } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java index dd364c196d8bf..8d6c3554c76ff 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java @@ -44,7 +44,7 @@ import org.apache.flink.streaming.api.environment.CheckpointConfig; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; import org.apache.flink.streaming.api.functions.sink.DiscardingSink; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import org.apache.flink.table.api.config.ExecutionConfigOptions; import javax.annotation.Nullable; @@ -220,7 +220,7 @@ public DataStream doWrite( + " : " + table.name(), new CommittableTypeInfo(), - createWriteOperator( + createWriteOperatorFactory( createWriteProvider( env.getCheckpointConfig(), isStreaming, @@ -268,11 +268,10 @@ protected DataStreamSink doCommit(DataStream written, String com } Options options = Options.fromMap(table.options()); - OneInputStreamOperator committerOperator = - new CommitterOperator<>( + OneInputStreamOperatorFactory committerOperator = + new CommitterOperatorFactory<>( streamingCheckpointEnabled, true, - options.get(SINK_COMMITTER_OPERATOR_CHAINING), commitUser, createCommitterFactory(), createCommittableStateManager(), @@ -280,8 +279,9 @@ protected DataStreamSink doCommit(DataStream written, String com if 
(options.get(SINK_AUTO_TAG_FOR_SAVEPOINT)) { committerOperator = - new AutoTagForSavepointCommitterOperator<>( - (CommitterOperator) committerOperator, + new AutoTagForSavepointCommitterOperatorFactory<>( + (CommitterOperatorFactory) + committerOperator, table::snapshotManager, table::tagManager, () -> table.store().newTagDeletion(), @@ -291,8 +291,9 @@ protected DataStreamSink doCommit(DataStream written, String com if (conf.get(ExecutionOptions.RUNTIME_MODE) == RuntimeExecutionMode.BATCH && table.coreOptions().tagCreationMode() == TagCreationMode.BATCH) { committerOperator = - new BatchWriteGeneratorTagOperator<>( - (CommitterOperator) committerOperator, + new BatchWriteGeneratorTagOperatorFactory<>( + (CommitterOperatorFactory) + committerOperator, table); } SingleOutputStreamOperator committed = @@ -310,6 +311,9 @@ protected DataStreamSink doCommit(DataStream written, String com table.name(), options.get(SINK_OPERATOR_UID_SUFFIX))); } + if (!options.get(SINK_COMMITTER_OPERATOR_CHAINING)) { + committed = committed.startNewChain(); + } configureGlobalCommitter( committed, options.get(SINK_COMMITTER_CPU), options.get(SINK_COMMITTER_MEMORY)); return committed.addSink(new DiscardingSink<>()).name("end").setParallelism(1); @@ -362,7 +366,7 @@ public static void assertBatchAdaptiveParallelism( } } - protected abstract OneInputStreamOperator createWriteOperator( + protected abstract OneInputStreamOperatorFactory createWriteOperatorFactory( StoreSinkWrite.Provider writeProvider, String commitUser); protected abstract Committer.Factory createCommitterFactory(); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSinkBuilder.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSinkBuilder.java index dcccd0a1a988b..5703c408243bd 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSinkBuilder.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSinkBuilder.java @@ -222,7 +222,7 @@ public DataStreamSink build() { .transform( "local merge", input.getType(), - new LocalMergeOperator(table.schema())) + new LocalMergeOperator.Factory(table.schema())) .setParallelism(input.getParallelism()); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/LocalMergeOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/LocalMergeOperator.java index 6931fe9072180..070262147643f 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/LocalMergeOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/LocalMergeOperator.java @@ -44,10 +44,15 @@ import org.apache.paimon.utils.UserDefinedSeqComparator; import org.apache.flink.streaming.api.operators.AbstractStreamOperator; +import org.apache.flink.streaming.api.operators.AbstractStreamOperatorFactory; import org.apache.flink.streaming.api.operators.BoundedOneInput; import org.apache.flink.streaming.api.operators.ChainingStrategy; import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import org.apache.flink.streaming.api.operators.Output; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import 
org.apache.flink.streaming.api.watermark.Watermark; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; @@ -76,13 +81,14 @@ public class LocalMergeOperator extends AbstractStreamOperator private transient boolean endOfInput; - public LocalMergeOperator(TableSchema schema) { + private LocalMergeOperator( + StreamOperatorParameters parameters, TableSchema schema) { Preconditions.checkArgument( schema.primaryKeys().size() > 0, "LocalMergeOperator currently only support tables with primary keys"); this.schema = schema; this.ignoreDelete = CoreOptions.fromMap(schema.options()).ignoreDelete(); - setChainingStrategy(ChainingStrategy.ALWAYS); + setup(parameters.getContainingTask(), parameters.getStreamConfig(), parameters.getOutput()); } @Override @@ -235,4 +241,28 @@ LocalMerger merger() { void setOutput(Output> output) { this.output = output; } + + /** {@link StreamOperatorFactory} of {@link LocalMergeOperator}. */ + public static class Factory extends AbstractStreamOperatorFactory + implements OneInputStreamOperatorFactory { + private final TableSchema schema; + + public Factory(TableSchema schema) { + this.chainingStrategy = ChainingStrategy.ALWAYS; + this.schema = schema; + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) new LocalMergeOperator(parameters, schema); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return LocalMergeOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java index 57d2e8413cb5b..58f6a3834096c 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/MultiTablesStoreCompactOperator.java @@ -33,6 +33,9 @@ import org.apache.flink.runtime.state.StateInitializationContext; import org.apache.flink.runtime.state.StateSnapshotContext; import org.apache.flink.streaming.api.environment.CheckpointConfig; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; import org.apache.flink.table.data.RowData; @@ -76,7 +79,8 @@ public class MultiTablesStoreCompactOperator protected Map writes; protected String commitUser; - public MultiTablesStoreCompactOperator( + private MultiTablesStoreCompactOperator( + StreamOperatorParameters parameters, Catalog.Loader catalogLoader, String initialCommitUser, CheckpointConfig checkpointConfig, @@ -84,7 +88,7 @@ public MultiTablesStoreCompactOperator( boolean ignorePreviousFiles, boolean fullCompaction, Options options) { - super(options); + super(parameters, options); this.catalogLoader = catalogLoader; this.initialCommitUser = initialCommitUser; this.checkpointConfig = checkpointConfig; @@ -316,4 +320,54 @@ private StoreSinkWrite.Provider createWriteProvider( memoryPool, metricGroup); } + + /** {@link StreamOperatorFactory} of {@link MultiTablesStoreCompactOperator}. 
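// Illustrative sketch (not part of this patch): the operator/factory migration applied to the
// classes above, reduced to a hypothetical UpperCaseOperator. The operator constructor now takes
// StreamOperatorParameters and calls setup() itself, and the chaining strategy moves from
// setChainingStrategy() on the operator to a field on the factory. Only Flink classes that the
// touched files already import are assumed.

import org.apache.flink.streaming.api.operators.AbstractStreamOperator;
import org.apache.flink.streaming.api.operators.AbstractStreamOperatorFactory;
import org.apache.flink.streaming.api.operators.ChainingStrategy;
import org.apache.flink.streaming.api.operators.OneInputStreamOperator;
import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory;
import org.apache.flink.streaming.api.operators.StreamOperator;
import org.apache.flink.streaming.api.operators.StreamOperatorParameters;
import org.apache.flink.streaming.runtime.streamrecord.StreamRecord;

public class UpperCaseOperator extends AbstractStreamOperator<String>
        implements OneInputStreamOperator<String, String> {

    // Created only by the factory below: the parameters are available at construction time,
    // so setup() can run immediately and no setter-style initialization is needed.
    private UpperCaseOperator(StreamOperatorParameters<String> parameters) {
        setup(parameters.getContainingTask(), parameters.getStreamConfig(), parameters.getOutput());
    }

    @Override
    public void processElement(StreamRecord<String> element) {
        output.collect(new StreamRecord<>(element.getValue().toUpperCase()));
    }

    /** Factory that replaces direct construction of the operator, mirroring the pattern above. */
    public static class Factory extends AbstractStreamOperatorFactory<String>
            implements OneInputStreamOperatorFactory<String, String> {

        public Factory() {
            // Previously expressed as setChainingStrategy(ChainingStrategy.ALWAYS) in the operator.
            this.chainingStrategy = ChainingStrategy.ALWAYS;
        }

        @Override
        @SuppressWarnings("unchecked")
        public <T extends StreamOperator<String>> T createStreamOperator(
                StreamOperatorParameters<String> parameters) {
            return (T) new UpperCaseOperator(parameters);
        }

        @Override
        @SuppressWarnings("rawtypes")
        public Class<? extends StreamOperator> getStreamOperatorClass(ClassLoader classLoader) {
            return UpperCaseOperator.class;
        }
    }
}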
*/ + public static class Factory + extends PrepareCommitOperator.Factory { + private final Catalog.Loader catalogLoader; + private final CheckpointConfig checkpointConfig; + private final boolean isStreaming; + private final boolean ignorePreviousFiles; + private final boolean fullCompaction; + private final String initialCommitUser; + + public Factory( + Catalog.Loader catalogLoader, + String initialCommitUser, + CheckpointConfig checkpointConfig, + boolean isStreaming, + boolean ignorePreviousFiles, + boolean fullCompaction, + Options options) { + super(options); + this.catalogLoader = catalogLoader; + this.initialCommitUser = initialCommitUser; + this.checkpointConfig = checkpointConfig; + this.isStreaming = isStreaming; + this.ignorePreviousFiles = ignorePreviousFiles; + this.fullCompaction = fullCompaction; + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new MultiTablesStoreCompactOperator( + parameters, + catalogLoader, + initialCommitUser, + checkpointConfig, + isStreaming, + ignorePreviousFiles, + fullCompaction, + options); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return MultiTablesStoreCompactOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/PrepareCommitOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/PrepareCommitOperator.java index 3668386ddc2db..8b114d3e492ff 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/PrepareCommitOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/PrepareCommitOperator.java @@ -26,10 +26,14 @@ import org.apache.flink.runtime.memory.MemoryManager; import org.apache.flink.streaming.api.graph.StreamConfig; import org.apache.flink.streaming.api.operators.AbstractStreamOperator; +import org.apache.flink.streaming.api.operators.AbstractStreamOperatorFactory; import org.apache.flink.streaming.api.operators.BoundedOneInput; import org.apache.flink.streaming.api.operators.ChainingStrategy; import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import org.apache.flink.streaming.api.operators.Output; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; import org.apache.flink.streaming.runtime.tasks.StreamTask; @@ -52,9 +56,9 @@ public abstract class PrepareCommitOperator extends AbstractStreamOpera private final Options options; private boolean endOfInput = false; - public PrepareCommitOperator(Options options) { + public PrepareCommitOperator(StreamOperatorParameters parameters, Options options) { this.options = options; - setChainingStrategy(ChainingStrategy.ALWAYS); + setup(parameters.getContainingTask(), parameters.getStreamConfig(), parameters.getOutput()); } @Override @@ -103,4 +107,15 @@ private void emitCommittables(boolean waitCompaction, long checkpointId) throws protected abstract List prepareCommit(boolean waitCompaction, long checkpointId) throws IOException; + + /** {@link StreamOperatorFactory} of {@link PrepareCommitOperator}. 
*/ + protected abstract static class Factory extends AbstractStreamOperatorFactory + implements OneInputStreamOperatorFactory { + protected final Options options; + + protected Factory(Options options) { + this.options = options; + this.chainingStrategy = ChainingStrategy.ALWAYS; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RewriteFileIndexSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RewriteFileIndexSink.java index 39dcca03c6aab..d9f863c6b9195 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RewriteFileIndexSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RewriteFileIndexSink.java @@ -45,11 +45,10 @@ import org.apache.paimon.utils.FileStorePathFactory; import org.apache.paimon.utils.Pair; -import org.apache.flink.streaming.api.graph.StreamConfig; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; -import org.apache.flink.streaming.api.operators.Output; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; -import org.apache.flink.streaming.runtime.tasks.StreamTask; import javax.annotation.Nullable; @@ -76,34 +75,49 @@ public RewriteFileIndexSink(FileStoreTable table) { } @Override - protected OneInputStreamOperator createWriteOperator( + protected OneInputStreamOperatorFactory createWriteOperatorFactory( StoreSinkWrite.Provider writeProvider, String commitUser) { - return new FileIndexModificationOperator(table.coreOptions().toConfiguration(), table); + return new FileIndexModificationOperatorFactory( + table.coreOptions().toConfiguration(), table); } - /** File index modification operator to rewrite file index. */ - private static class FileIndexModificationOperator - extends PrepareCommitOperator { - - private static final long serialVersionUID = 1L; - + private static class FileIndexModificationOperatorFactory + extends PrepareCommitOperator.Factory { private final FileStoreTable table; - private transient FileIndexProcessor fileIndexProcessor; - private transient List messages; - - public FileIndexModificationOperator(Options options, FileStoreTable table) { + public FileIndexModificationOperatorFactory(Options options, FileStoreTable table) { super(options); this.table = table; } @Override - public void setup( - StreamTask containingTask, - StreamConfig config, - Output> output) { - super.setup(containingTask, config, output); + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) new FileIndexModificationOperator(parameters, options, table); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return FileIndexModificationOperator.class; + } + } + + /** File index modification operator to rewrite file index. 
*/ + private static class FileIndexModificationOperator + extends PrepareCommitOperator { + + private static final long serialVersionUID = 1L; + + private final transient FileIndexProcessor fileIndexProcessor; + private final transient List messages; + private FileIndexModificationOperator( + StreamOperatorParameters parameters, + Options options, + FileStoreTable table) { + super(parameters, options); this.fileIndexProcessor = new FileIndexProcessor(table); this.messages = new ArrayList<>(); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDataStoreWriteOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDataStoreWriteOperator.java index 2b25f074667c3..8009bec9677f7 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDataStoreWriteOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDataStoreWriteOperator.java @@ -32,13 +32,13 @@ import org.apache.flink.runtime.state.StateInitializationContext; import org.apache.flink.runtime.state.StateSnapshotContext; import org.apache.flink.streaming.api.functions.sink.SinkFunction; -import org.apache.flink.streaming.api.graph.StreamConfig; import org.apache.flink.streaming.api.operators.InternalTimerService; -import org.apache.flink.streaming.api.operators.Output; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.api.watermark.Watermark; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; import org.apache.flink.streaming.runtime.tasks.ProcessingTimeService; -import org.apache.flink.streaming.runtime.tasks.StreamTask; import org.apache.flink.streaming.util.functions.StreamingFunctionUtils; import javax.annotation.Nullable; @@ -61,21 +61,14 @@ public class RowDataStoreWriteOperator extends TableWriteOperator { /** We listen to this ourselves because we don't have an {@link InternalTimerService}. */ private long currentWatermark = Long.MIN_VALUE; - public RowDataStoreWriteOperator( + protected RowDataStoreWriteOperator( + StreamOperatorParameters parameters, FileStoreTable table, @Nullable LogSinkFunction logSinkFunction, StoreSinkWrite.Provider storeSinkWriteProvider, String initialCommitUser) { - super(table, storeSinkWriteProvider, initialCommitUser); + super(parameters, table, storeSinkWriteProvider, initialCommitUser); this.logSinkFunction = logSinkFunction; - } - - @Override - public void setup( - StreamTask containingTask, - StreamConfig config, - Output> output) { - super.setup(containingTask, config, output); if (logSinkFunction != null) { FunctionUtils.setFunctionRuntimeContext(logSinkFunction, getRuntimeContext()); } @@ -249,4 +242,38 @@ public Long timestamp() { return timestamp; } } + + /** {@link StreamOperatorFactory} of {@link RowDataStoreWriteOperator}. 
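// Usage sketch (not part of this patch): wiring a factory-based operator into a pipeline with
// DataStream.transform(name, typeInfo, factory), the same call shape FlinkSinkBuilder and
// FlinkSink.doWrite() use above. UpperCaseOperator.Factory is the hypothetical factory from the
// earlier sketch; everything else is standard Flink API.

import org.apache.flink.api.common.typeinfo.Types;
import org.apache.flink.streaming.api.datastream.DataStream;
import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment;

public class FactoryWiringSketch {

    public static void main(String[] args) throws Exception {
        StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();

        DataStream<String> upperCased =
                env.fromElements("paimon", "flink")
                        // transform(...) accepts the factory directly; the runtime decides when
                        // and where the operator instance is actually created.
                        .transform("upper case", Types.STRING, new UpperCaseOperator.Factory())
                        // Chaining is now steered from the outside, e.g. FlinkSink.doCommit()
                        // calls startNewChain() when committer chaining is disabled.
                        .startNewChain();

        upperCased.print();
        env.execute("factory wiring sketch");
    }
}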
*/ + public static class Factory extends TableWriteOperator.Factory { + + @Nullable private final LogSinkFunction logSinkFunction; + + public Factory( + FileStoreTable table, + @Nullable LogSinkFunction logSinkFunction, + StoreSinkWrite.Provider storeSinkWriteProvider, + String initialCommitUser) { + super(table, storeSinkWriteProvider, initialCommitUser); + this.logSinkFunction = logSinkFunction; + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new RowDataStoreWriteOperator( + parameters, + table, + logSinkFunction, + storeSinkWriteProvider, + initialCommitUser); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return RowDataStoreWriteOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDynamicBucketSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDynamicBucketSink.java index bf6c70f0aa295..1f7e62d74916e 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDynamicBucketSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowDynamicBucketSink.java @@ -27,7 +27,7 @@ import org.apache.paimon.utils.SerializableFunction; import org.apache.flink.api.java.tuple.Tuple2; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import javax.annotation.Nullable; @@ -60,8 +60,8 @@ protected ChannelComputer> channelComputer2() { } @Override - protected OneInputStreamOperator, Committable> createWriteOperator( - StoreSinkWrite.Provider writeProvider, String commitUser) { - return new DynamicBucketRowWriteOperator(table, writeProvider, commitUser); + protected OneInputStreamOperatorFactory, Committable> + createWriteOperatorFactory(StoreSinkWrite.Provider writeProvider, String commitUser) { + return new DynamicBucketRowWriteOperator.Factory(table, writeProvider, commitUser); } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowUnawareBucketSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowUnawareBucketSink.java index 1cd10390c1a0a..fea8a382a954c 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowUnawareBucketSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/RowUnawareBucketSink.java @@ -22,7 +22,9 @@ import org.apache.paimon.table.FileStoreTable; import org.apache.flink.runtime.state.StateInitializationContext; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import java.util.Map; @@ -38,25 +40,35 @@ public RowUnawareBucketSink( } @Override - protected OneInputStreamOperator createWriteOperator( + protected OneInputStreamOperatorFactory createWriteOperatorFactory( StoreSinkWrite.Provider writeProvider, String commitUser) { - return new RowDataStoreWriteOperator(table, logSinkFunction, writeProvider, commitUser) { - + return new RowDataStoreWriteOperator.Factory( + table, logSinkFunction, writeProvider, commitUser) { @Override - protected StoreSinkWriteState 
createState( - StateInitializationContext context, - StoreSinkWriteState.StateValueFilter stateFilter) - throws Exception { - // No conflicts will occur in append only unaware bucket writer, so no state is - // needed. - return new NoopStoreSinkWriteState(stateFilter); - } + public StreamOperator createStreamOperator(StreamOperatorParameters parameters) { + return new RowDataStoreWriteOperator( + parameters, table, logSinkFunction, writeProvider, commitUser) { - @Override - protected String getCommitUser(StateInitializationContext context) throws Exception { - // No conflicts will occur in append only unaware bucket writer, so commitUser does - // not matter. - return commitUser; + @Override + protected StoreSinkWriteState createState( + StateInitializationContext context, + StoreSinkWriteState.StateValueFilter stateFilter) + throws Exception { + // No conflicts will occur in append only unaware bucket writer, so no state + // is + // needed. + return new NoopStoreSinkWriteState(stateFilter); + } + + @Override + protected String getCommitUser(StateInitializationContext context) + throws Exception { + // No conflicts will occur in append only unaware bucket writer, so + // commitUser does + // not matter. + return commitUser; + } + }; } }; } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCompactOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCompactOperator.java index ac10345bc4257..1870a0493c2f1 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCompactOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/StoreCompactOperator.java @@ -31,6 +31,9 @@ import org.apache.flink.runtime.state.StateInitializationContext; import org.apache.flink.runtime.state.StateSnapshotContext; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; import org.apache.flink.table.data.RowData; @@ -60,12 +63,13 @@ public class StoreCompactOperator extends PrepareCommitOperator> waitToCompact; - public StoreCompactOperator( + private StoreCompactOperator( + StreamOperatorParameters parameters, FileStoreTable table, StoreSinkWrite.Provider storeSinkWriteProvider, String initialCommitUser, boolean fullCompaction) { - super(Options.fromMap(table.options())); + super(parameters, Options.fromMap(table.options())); Preconditions.checkArgument( !table.coreOptions().writeOnly(), CoreOptions.WRITE_ONLY.key() + " should not be true for StoreCompactOperator."); @@ -163,4 +167,46 @@ public void close() throws Exception { super.close(); write.close(); } + + /** {@link StreamOperatorFactory} of {@link StoreCompactOperator}. 
*/ + public static class Factory extends PrepareCommitOperator.Factory { + private final FileStoreTable table; + private final StoreSinkWrite.Provider storeSinkWriteProvider; + private final String initialCommitUser; + private final boolean fullCompaction; + + public Factory( + FileStoreTable table, + StoreSinkWrite.Provider storeSinkWriteProvider, + String initialCommitUser, + boolean fullCompaction) { + super(Options.fromMap(table.options())); + Preconditions.checkArgument( + !table.coreOptions().writeOnly(), + CoreOptions.WRITE_ONLY.key() + " should not be true for StoreCompactOperator."); + this.table = table; + this.storeSinkWriteProvider = storeSinkWriteProvider; + this.initialCommitUser = initialCommitUser; + this.fullCompaction = fullCompaction; + } + + @Override + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new StoreCompactOperator( + parameters, + table, + storeSinkWriteProvider, + initialCommitUser, + fullCompaction); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return StoreCompactOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/TableWriteOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/TableWriteOperator.java index 32fcdd03bdfd5..fd876698c094a 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/TableWriteOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/TableWriteOperator.java @@ -28,6 +28,8 @@ import org.apache.flink.runtime.state.StateInitializationContext; import org.apache.flink.runtime.state.StateSnapshotContext; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.RecordAttributes; import java.io.IOException; @@ -45,10 +47,11 @@ public abstract class TableWriteOperator extends PrepareCommitOperator parameters, FileStoreTable table, StoreSinkWrite.Provider storeSinkWriteProvider, String initialCommitUser) { - super(Options.fromMap(table.options())); + super(parameters, Options.fromMap(table.options())); this.table = table; this.storeSinkWriteProvider = storeSinkWriteProvider; this.initialCommitUser = initialCommitUser; @@ -128,4 +131,22 @@ protected List prepareCommit(boolean waitCompaction, long checkpoin public StoreSinkWrite getWrite() { return write; } + + /** {@link StreamOperatorFactory} of {@link TableWriteOperator}. 
*/ + protected abstract static class Factory + extends PrepareCommitOperator.Factory { + protected final FileStoreTable table; + protected final StoreSinkWrite.Provider storeSinkWriteProvider; + protected final String initialCommitUser; + + protected Factory( + FileStoreTable table, + StoreSinkWrite.Provider storeSinkWriteProvider, + String initialCommitUser) { + super(Options.fromMap(table.options())); + this.table = table; + this.storeSinkWriteProvider = storeSinkWriteProvider; + this.initialCommitUser = initialCommitUser; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/UnawareBucketCompactionSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/UnawareBucketCompactionSink.java index da966d5e51566..7a4095f896cc3 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/UnawareBucketCompactionSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/UnawareBucketCompactionSink.java @@ -24,7 +24,7 @@ import org.apache.flink.streaming.api.datastream.DataStream; import org.apache.flink.streaming.api.datastream.DataStreamSink; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; /** Compaction Sink for unaware-bucket table. */ public class UnawareBucketCompactionSink extends FlinkSink { @@ -42,9 +42,9 @@ public static DataStreamSink sink( } @Override - protected OneInputStreamOperator createWriteOperator( - StoreSinkWrite.Provider writeProvider, String commitUser) { - return new AppendOnlySingleTableCompactionWorkerOperator(table, commitUser); + protected OneInputStreamOperatorFactory + createWriteOperatorFactory(StoreSinkWrite.Provider writeProvider, String commitUser) { + return new AppendOnlySingleTableCompactionWorkerOperator.Factory(table, commitUser); } @Override diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/UnawareBucketSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/UnawareBucketSink.java index 98b58aa8e96d3..7bc40d4c2080b 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/UnawareBucketSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/UnawareBucketSink.java @@ -74,11 +74,14 @@ public DataStream doWrite( new CommittableTypeInfo(), new CompactionTaskTypeInfo()), new AppendBypassCoordinateOperatorFactory<>(table)) + .startNewChain() .forceNonParallel() .transform( "Compact Worker: " + table.name(), new CommittableTypeInfo(), - new AppendBypassCompactWorkerOperator(table, initialCommitUser)) + new AppendBypassCompactWorkerOperator.Factory( + table, initialCommitUser)) + .startNewChain() .setParallelism(written.getParallelism()); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/GlobalDynamicBucketSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/GlobalDynamicBucketSink.java index 26e080c32e834..7022002a43ba3 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/GlobalDynamicBucketSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/GlobalDynamicBucketSink.java @@ -39,7 +39,7 @@ import org.apache.flink.api.java.typeutils.TupleTypeInfo; import org.apache.flink.streaming.api.datastream.DataStream; import 
org.apache.flink.streaming.api.datastream.DataStreamSink; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import javax.annotation.Nullable; @@ -63,9 +63,9 @@ public GlobalDynamicBucketSink( } @Override - protected OneInputStreamOperator, Committable> createWriteOperator( - StoreSinkWrite.Provider writeProvider, String commitUser) { - return new DynamicBucketRowWriteOperator(table, writeProvider, commitUser); + protected OneInputStreamOperatorFactory, Committable> + createWriteOperatorFactory(StoreSinkWrite.Provider writeProvider, String commitUser) { + return new DynamicBucketRowWriteOperator.Factory(table, writeProvider, commitUser); } public DataStreamSink build(DataStream input, @Nullable Integer parallelism) { @@ -89,7 +89,8 @@ public DataStreamSink build(DataStream input, @Nullable Integer new InternalTypeInfo<>( new KeyWithRowSerializer<>( bootstrapSerializer, rowSerializer)), - new IndexBootstrapOperator<>(new IndexBootstrap(table), r -> r)) + new IndexBootstrapOperator.Factory<>( + new IndexBootstrap(table), r -> r)) .setParallelism(input.getParallelism()); // 1. shuffle by key hash diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/IndexBootstrapOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/IndexBootstrapOperator.java index 5c8ba8f9441f3..8136565f98cf8 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/IndexBootstrapOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/index/IndexBootstrapOperator.java @@ -27,8 +27,13 @@ import org.apache.flink.api.java.tuple.Tuple2; import org.apache.flink.runtime.state.StateInitializationContext; import org.apache.flink.streaming.api.operators.AbstractStreamOperator; +import org.apache.flink.streaming.api.operators.AbstractStreamOperatorFactory; import org.apache.flink.streaming.api.operators.ChainingStrategy; import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; /** Operator for {@link IndexBootstrap}. */ @@ -40,11 +45,13 @@ public class IndexBootstrapOperator extends AbstractStreamOperator converter; - public IndexBootstrapOperator( - IndexBootstrap bootstrap, SerializableFunction converter) { + private IndexBootstrapOperator( + StreamOperatorParameters> parameters, + IndexBootstrap bootstrap, + SerializableFunction converter) { this.bootstrap = bootstrap; this.converter = converter; - setChainingStrategy(ChainingStrategy.ALWAYS); + setup(parameters.getContainingTask(), parameters.getStreamConfig(), parameters.getOutput()); } @Override @@ -65,4 +72,30 @@ private void collect(InternalRow row) { output.collect( new StreamRecord<>(new Tuple2<>(KeyPartOrRow.KEY_PART, converter.apply(row)))); } + + /** {@link StreamOperatorFactory} of {@link IndexBootstrapOperator}. 
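// Test-side sketch (not part of this patch): with only factories public, the reworked tests
// below obtain operator instances by building StreamOperatorParameters from Flink's test
// utilities and asking the factory, as the compaction worker and LocalMergeOperator tests do.
// UpperCaseOperator.Factory is the hypothetical factory from the earlier sketch; the
// six-argument StreamOperatorParameters constructor follows the usage in this patch and
// differs between Flink versions.

import java.util.ArrayList;

import org.apache.flink.configuration.Configuration;
import org.apache.flink.runtime.operators.testutils.DummyEnvironment;
import org.apache.flink.streaming.api.operators.OneInputStreamOperator;
import org.apache.flink.streaming.api.operators.StreamOperatorParameters;
import org.apache.flink.streaming.runtime.streamrecord.StreamRecord;
import org.apache.flink.streaming.runtime.tasks.SourceOperatorStreamTask;
import org.apache.flink.streaming.util.MockOutput;
import org.apache.flink.streaming.util.MockStreamConfig;

public class OperatorFromFactorySketch {

    static OneInputStreamOperator<String, String> createForTest() throws Exception {
        return new UpperCaseOperator.Factory()
                .createStreamOperator(
                        new StreamOperatorParameters<>(
                                new SourceOperatorStreamTask<Integer>(new DummyEnvironment()),
                                new MockStreamConfig(new Configuration(), 1),
                                new MockOutput<>(new ArrayList<>()),
                                null, // processing time service factory, unused here
                                null, // operator event dispatcher, unused here
                                null)); // mailbox executor, unused here
    }

    public static void main(String[] args) throws Exception {
        OneInputStreamOperator<String, String> operator = createForTest();
        operator.open();
        operator.processElement(new StreamRecord<>("paimon"));
        operator.close();
    }
}

// Alternatively, OneInputStreamOperatorTestHarness accepts the factory directly and exposes the
// created operator via getOneInputOperator(), which is what the harness-based tests below use.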
*/ + public static class Factory extends AbstractStreamOperatorFactory> + implements OneInputStreamOperatorFactory> { + private final IndexBootstrap bootstrap; + private final SerializableFunction converter; + + public Factory(IndexBootstrap bootstrap, SerializableFunction converter) { + this.chainingStrategy = ChainingStrategy.ALWAYS; + this.bootstrap = bootstrap; + this.converter = converter; + } + + @Override + @SuppressWarnings("unchecked") + public >> OP createStreamOperator( + StreamOperatorParameters> parameters) { + return (OP) new IndexBootstrapOperator<>(parameters, bootstrap, converter); + } + + @Override + @SuppressWarnings("rawtypes") + public Class getStreamOperatorClass(ClassLoader classLoader) { + return IndexBootstrapOperator.class; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperator.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperator.java index 45090f7b68b40..b8b0d61e10a96 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperator.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperator.java @@ -26,8 +26,8 @@ import org.apache.flink.api.common.operators.ProcessingTimeService.ProcessingTimeCallback; import org.apache.flink.streaming.api.operators.AbstractStreamOperator; -import org.apache.flink.streaming.api.operators.ChainingStrategy; import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; import org.apache.flink.streaming.runtime.tasks.ProcessingTimeService; import org.apache.flink.types.Either; @@ -58,10 +58,12 @@ public class AppendBypassCoordinateOperator private transient LinkedBlockingQueue compactTasks; public AppendBypassCoordinateOperator( - FileStoreTable table, ProcessingTimeService processingTimeService) { + StreamOperatorParameters> parameters, + FileStoreTable table, + ProcessingTimeService processingTimeService) { this.table = table; this.processingTimeService = processingTimeService; - this.chainingStrategy = ChainingStrategy.HEAD; + setup(parameters.getContainingTask(), parameters.getStreamConfig(), parameters.getOutput()); } @Override diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperatorFactory.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperatorFactory.java index 7c53e01b47e65..a4c51e5b5a9be 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperatorFactory.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/source/AppendBypassCoordinateOperatorFactory.java @@ -45,11 +45,7 @@ T createStreamOperator( StreamOperatorParameters> parameters) { AppendBypassCoordinateOperator operator = - new AppendBypassCoordinateOperator<>(table, processingTimeService); - operator.setup( - parameters.getContainingTask(), - parameters.getStreamConfig(), - parameters.getOutput()); + new AppendBypassCoordinateOperator<>(parameters, table, processingTimeService); return (T) operator; } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AppendOnlyMultiTableCompactionWorkerOperatorTest.java 
b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AppendOnlyMultiTableCompactionWorkerOperatorTest.java index d589459d9b969..949c2c7a66a36 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AppendOnlyMultiTableCompactionWorkerOperatorTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AppendOnlyMultiTableCompactionWorkerOperatorTest.java @@ -25,7 +25,13 @@ import org.apache.paimon.table.sink.CommitMessage; import org.apache.paimon.table.sink.CommitMessageImpl; +import org.apache.flink.configuration.Configuration; +import org.apache.flink.runtime.operators.testutils.DummyEnvironment; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; +import org.apache.flink.streaming.runtime.tasks.SourceOperatorStreamTask; +import org.apache.flink.streaming.util.MockOutput; +import org.apache.flink.streaming.util.MockStreamConfig; import org.assertj.core.api.Assertions; import org.junit.jupiter.api.Test; @@ -45,8 +51,17 @@ public class AppendOnlyMultiTableCompactionWorkerOperatorTest extends TableTestB public void testAsyncCompactionWorks() throws Exception { AppendOnlyMultiTableCompactionWorkerOperator workerOperator = - new AppendOnlyMultiTableCompactionWorkerOperator( - () -> catalog, "user", new Options()); + new AppendOnlyMultiTableCompactionWorkerOperator.Factory( + () -> catalog, "user", new Options()) + .createStreamOperator( + new StreamOperatorParameters<>( + new SourceOperatorStreamTask( + new DummyEnvironment()), + new MockStreamConfig(new Configuration(), 1), + new MockOutput<>(new ArrayList<>()), + null, + null, + null)); List> records = new ArrayList<>(); // create table and write diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AppendOnlySingleTableCompactionWorkerOperatorTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AppendOnlySingleTableCompactionWorkerOperatorTest.java index d04032817cf01..6238a9cbf3ea0 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AppendOnlySingleTableCompactionWorkerOperatorTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AppendOnlySingleTableCompactionWorkerOperatorTest.java @@ -32,7 +32,13 @@ import org.apache.paimon.table.sink.CommitMessageImpl; import org.apache.paimon.types.DataTypes; +import org.apache.flink.configuration.Configuration; +import org.apache.flink.runtime.operators.testutils.DummyEnvironment; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; +import org.apache.flink.streaming.runtime.tasks.SourceOperatorStreamTask; +import org.apache.flink.streaming.util.MockOutput; +import org.apache.flink.streaming.util.MockStreamConfig; import org.assertj.core.api.Assertions; import org.junit.jupiter.api.Test; @@ -49,7 +55,16 @@ public class AppendOnlySingleTableCompactionWorkerOperatorTest extends TableTest public void testAsyncCompactionWorks() throws Exception { createTableDefault(); AppendOnlySingleTableCompactionWorkerOperator workerOperator = - new AppendOnlySingleTableCompactionWorkerOperator(getTableDefault(), "user"); + new AppendOnlySingleTableCompactionWorkerOperator.Factory(getTableDefault(), "user") + .createStreamOperator( + new StreamOperatorParameters<>( + new SourceOperatorStreamTask( + new 
DummyEnvironment()), + new MockStreamConfig(new Configuration(), 1), + new MockOutput<>(new ArrayList<>()), + null, + null, + null)); // write 200 files List commitMessages = writeDataDefault(200, 20); @@ -102,7 +117,16 @@ public void testAsyncCompactionWorks() throws Exception { public void testAsyncCompactionFileDeletedWhenShutdown() throws Exception { createTableDefault(); AppendOnlySingleTableCompactionWorkerOperator workerOperator = - new AppendOnlySingleTableCompactionWorkerOperator(getTableDefault(), "user"); + new AppendOnlySingleTableCompactionWorkerOperator.Factory(getTableDefault(), "user") + .createStreamOperator( + new StreamOperatorParameters<>( + new SourceOperatorStreamTask( + new DummyEnvironment()), + new MockStreamConfig(new Configuration(), 1), + new MockOutput<>(new ArrayList<>()), + null, + null, + null)); // write 200 files List commitMessages = writeDataDefault(200, 40); diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperatorTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperatorTest.java index 3b58c24d16b18..ee930a06fc3d0 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperatorTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/AutoTagForSavepointCommitterOperatorTest.java @@ -32,7 +32,7 @@ import org.apache.flink.runtime.checkpoint.OperatorSubtaskState; import org.apache.flink.runtime.checkpoint.SavepointType; import org.apache.flink.runtime.state.StateInitializationContext; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import org.apache.flink.streaming.util.OneInputStreamOperatorTestHarness; import org.junit.jupiter.api.Test; @@ -198,13 +198,15 @@ private void processCommittable( } @Override - protected OneInputStreamOperator createCommitterOperator( - FileStoreTable table, - String commitUser, - CommittableStateManager committableStateManager) { - return new AutoTagForSavepointCommitterOperator<>( - (CommitterOperator) - super.createCommitterOperator(table, commitUser, committableStateManager), + protected OneInputStreamOperatorFactory + createCommitterOperatorFactory( + FileStoreTable table, + String commitUser, + CommittableStateManager committableStateManager) { + return new AutoTagForSavepointCommitterOperatorFactory<>( + (CommitterOperatorFactory) + super.createCommitterOperatorFactory( + table, commitUser, committableStateManager), table::snapshotManager, table::tagManager, () -> table.store().newTagDeletion(), @@ -213,14 +215,15 @@ protected OneInputStreamOperator createCommitterOperat } @Override - protected OneInputStreamOperator createCommitterOperator( - FileStoreTable table, - String commitUser, - CommittableStateManager committableStateManager, - ThrowingConsumer initializeFunction) { - return new AutoTagForSavepointCommitterOperator<>( - (CommitterOperator) - super.createCommitterOperator( + protected OneInputStreamOperatorFactory + createCommitterOperatorFactory( + FileStoreTable table, + String commitUser, + CommittableStateManager committableStateManager, + ThrowingConsumer initializeFunction) { + return new AutoTagForSavepointCommitterOperatorFactory<>( + (CommitterOperatorFactory) + super.createCommitterOperatorFactory( table, commitUser, committableStateManager, initializeFunction), 
table::snapshotManager, table::tagManager, diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperatorTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperatorTest.java index 147110637aef6..68162832eac9c 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperatorTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/BatchWriteGeneratorTagOperatorTest.java @@ -27,13 +27,21 @@ import org.apache.paimon.utils.SnapshotManager; import org.apache.paimon.utils.TagManager; +import org.apache.flink.configuration.Configuration; +import org.apache.flink.runtime.operators.testutils.DummyEnvironment; import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; +import org.apache.flink.streaming.runtime.tasks.SourceOperatorStreamTask; +import org.apache.flink.streaming.util.MockOutput; +import org.apache.flink.streaming.util.MockStreamConfig; import org.junit.jupiter.api.Test; import java.time.Instant; import java.time.LocalDateTime; import java.time.ZoneId; import java.time.format.DateTimeFormatter; +import java.util.ArrayList; import java.util.HashMap; import java.util.Objects; @@ -54,12 +62,23 @@ public void testBatchWriteGeneratorTag() throws Exception { StreamTableWrite write = table.newStreamWriteBuilder().withCommitUser(initialCommitUser).newWrite(); - OneInputStreamOperator committerOperator = - createCommitterOperator( + OneInputStreamOperatorFactory committerOperatorFactory = + createCommitterOperatorFactory( table, initialCommitUser, new RestoreAndFailCommittableStateManager<>( ManifestCommittableSerializer::new)); + + OneInputStreamOperator committerOperator = + committerOperatorFactory.createStreamOperator( + new StreamOperatorParameters<>( + new SourceOperatorStreamTask(new DummyEnvironment()), + new MockStreamConfig(new Configuration(), 1), + new MockOutput<>(new ArrayList<>()), + null, + null, + null)); + committerOperator.open(); TableCommitImpl tableCommit = table.newCommit(initialCommitUser); @@ -106,13 +125,15 @@ public void testBatchWriteGeneratorTag() throws Exception { } @Override - protected OneInputStreamOperator createCommitterOperator( - FileStoreTable table, - String commitUser, - CommittableStateManager committableStateManager) { - return new BatchWriteGeneratorTagOperator<>( - (CommitterOperator) - super.createCommitterOperator(table, commitUser, committableStateManager), + protected OneInputStreamOperatorFactory + createCommitterOperatorFactory( + FileStoreTable table, + String commitUser, + CommittableStateManager committableStateManager) { + return new BatchWriteGeneratorTagOperatorFactory<>( + (CommitterOperatorFactory) + super.createCommitterOperatorFactory( + table, commitUser, committableStateManager), table); } } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CommitterOperatorTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CommitterOperatorTest.java index 668d651236fdc..28c93ca79be02 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CommitterOperatorTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CommitterOperatorTest.java @@ 
-51,10 +51,13 @@ import org.apache.flink.runtime.checkpoint.OperatorSubtaskState; import org.apache.flink.runtime.jobgraph.OperatorID; import org.apache.flink.runtime.state.StateInitializationContext; -import org.apache.flink.streaming.api.operators.OneInputStreamOperator; +import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; +import org.apache.flink.streaming.api.operators.StreamOperator; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.api.watermark.Watermark; import org.apache.flink.streaming.util.AbstractStreamOperatorTestHarness; import org.apache.flink.streaming.util.OneInputStreamOperatorTestHarness; +import org.apache.flink.util.Preconditions; import org.assertj.core.api.Assertions; import org.junit.jupiter.api.BeforeEach; import org.junit.jupiter.api.Test; @@ -259,8 +262,8 @@ public void testRestoreCommitUser() throws Exception { // 3. Check whether success List actual = new ArrayList<>(); - OneInputStreamOperator operator = - createCommitterOperator( + OneInputStreamOperatorFactory operatorFactory = + createCommitterOperatorFactory( table, initialCommitUser, new NoopCommittableStateManager(), @@ -274,7 +277,7 @@ public void testRestoreCommitUser() throws Exception { }); OneInputStreamOperatorTestHarness testHarness1 = - createTestHarness(operator); + createTestHarness(operatorFactory); testHarness1.initializeState(snapshot); testHarness1.close(); @@ -315,10 +318,11 @@ public void testRestoreEmptyMarkDoneState() throws Exception { public void testCommitInputEnd() throws Exception { FileStoreTable table = createFileStoreTable(); String commitUser = UUID.randomUUID().toString(); - OneInputStreamOperator operator = - createCommitterOperator(table, commitUser, new NoopCommittableStateManager()); + OneInputStreamOperatorFactory operatorFactory = + createCommitterOperatorFactory( + table, commitUser, new NoopCommittableStateManager()); OneInputStreamOperatorTestHarness testHarness = - createTestHarness(operator); + createTestHarness(operatorFactory); testHarness.open(); Assertions.assertThatCode( () -> { @@ -378,10 +382,10 @@ public void testCommitInputEnd() throws Exception { }) .doesNotThrowAnyException(); - if (operator instanceof CommitterOperator) { + if (operatorFactory instanceof CommitterOperator) { Assertions.assertThat( ((ManifestCommittable) - ((CommitterOperator) operator) + ((CommitterOperator) operatorFactory) .committablesPerCheckpoint.get(Long.MAX_VALUE)) .fileCommittables() .size()) @@ -604,14 +608,14 @@ public void testCalcDataBytesSend() throws Exception { public void testCommitMetrics() throws Exception { FileStoreTable table = createFileStoreTable(); - OneInputStreamOperator operator = - createCommitterOperator( + OneInputStreamOperatorFactory operatorFactory = + createCommitterOperatorFactory( table, null, new RestoreAndFailCommittableStateManager<>( ManifestCommittableSerializer::new)); OneInputStreamOperatorTestHarness testHarness = - createTestHarness(operator); + createTestHarness(operatorFactory); testHarness.open(); long timestamp = 0; StreamTableWrite write = @@ -627,7 +631,9 @@ public void testCommitMetrics() throws Exception { testHarness.notifyOfCompletedCheckpoint(cpId); MetricGroup commitMetricGroup = - operator.getMetricGroup() + testHarness + .getOneInputOperator() + .getMetricGroup() .addGroup("paimon") .addGroup("table", table.name()) .addGroup("commit"); @@ -685,10 +691,11 @@ public void testCommitMetrics() throws Exception { public void testParallelism() throws 
Exception { FileStoreTable table = createFileStoreTable(); String commitUser = UUID.randomUUID().toString(); - OneInputStreamOperator operator = - createCommitterOperator(table, commitUser, new NoopCommittableStateManager()); + OneInputStreamOperatorFactory operatorFactory = + createCommitterOperatorFactory( + table, commitUser, new NoopCommittableStateManager()); try (OneInputStreamOperatorTestHarness testHarness = - createTestHarness(operator, 10, 10, 3)) { + createTestHarness(operatorFactory, 10, 10, 3)) { Assertions.assertThatCode(testHarness::open) .hasMessage("Committer Operator parallelism in paimon MUST be one."); } @@ -700,13 +707,13 @@ public void testParallelism() throws Exception { protected OneInputStreamOperatorTestHarness createRecoverableTestHarness(FileStoreTable table) throws Exception { - OneInputStreamOperator operator = - createCommitterOperator( + OneInputStreamOperatorFactory operatorFactory = + createCommitterOperatorFactory( table, null, new RestoreAndFailCommittableStateManager<>( ManifestCommittableSerializer::new)); - return createTestHarness(operator); + return createTestHarness(operatorFactory); } private OneInputStreamOperatorTestHarness createLossyTestHarness( @@ -716,18 +723,20 @@ private OneInputStreamOperatorTestHarness createLossyT private OneInputStreamOperatorTestHarness createLossyTestHarness( FileStoreTable table, String commitUser) throws Exception { - OneInputStreamOperator operator = - createCommitterOperator(table, commitUser, new NoopCommittableStateManager()); - return createTestHarness(operator); + OneInputStreamOperatorFactory operatorFactory = + createCommitterOperatorFactory( + table, commitUser, new NoopCommittableStateManager()); + return createTestHarness(operatorFactory); } private OneInputStreamOperatorTestHarness createTestHarness( - OneInputStreamOperator operator) throws Exception { - return createTestHarness(operator, 1, 1, 0); + OneInputStreamOperatorFactory operatorFactory) + throws Exception { + return createTestHarness(operatorFactory, 1, 1, 0); } private OneInputStreamOperatorTestHarness createTestHarness( - OneInputStreamOperator operator, + OneInputStreamOperatorFactory operatorFactory, int maxParallelism, int parallelism, int subTaskIndex) @@ -736,22 +745,23 @@ private OneInputStreamOperatorTestHarness createTestHa new CommittableTypeInfo().createSerializer(new ExecutionConfig()); OneInputStreamOperatorTestHarness harness = new OneInputStreamOperatorTestHarness<>( - operator, + operatorFactory, maxParallelism, parallelism, subTaskIndex, - serializer, new OperatorID()); + harness.getStreamConfig().setupNetworkInputs(Preconditions.checkNotNull(serializer)); + harness.getStreamConfig().serializeAllConfigs(); harness.setup(serializer); return harness; } - protected OneInputStreamOperator createCommitterOperator( - FileStoreTable table, - String commitUser, - CommittableStateManager committableStateManager) { - return new CommitterOperator<>( - true, + protected OneInputStreamOperatorFactory + createCommitterOperatorFactory( + FileStoreTable table, + String commitUser, + CommittableStateManager committableStateManager) { + return new CommitterOperatorFactory<>( true, true, commitUser == null ? 
initialCommitUser : commitUser, @@ -765,13 +775,13 @@ protected OneInputStreamOperator createCommitterOperat committableStateManager); } - protected OneInputStreamOperator createCommitterOperator( - FileStoreTable table, - String commitUser, - CommittableStateManager committableStateManager, - ThrowingConsumer initializeFunction) { - return new CommitterOperator( - true, + protected OneInputStreamOperatorFactory + createCommitterOperatorFactory( + FileStoreTable table, + String commitUser, + CommittableStateManager committableStateManager, + ThrowingConsumer initializeFunction) { + return new CommitterOperatorFactory( true, true, commitUser == null ? initialCommitUser : commitUser, @@ -784,8 +794,24 @@ protected OneInputStreamOperator createCommitterOperat context), committableStateManager) { @Override - public void initializeState(StateInitializationContext context) throws Exception { - initializeFunction.accept(context); + @SuppressWarnings("unchecked") + public > T createStreamOperator( + StreamOperatorParameters parameters) { + return (T) + new CommitterOperator( + parameters, + streamingCheckpointEnabled, + forceSingleParallelism, + initialCommitUser, + committerFactory, + committableStateManager, + endInputWatermark) { + @Override + public void initializeState(StateInitializationContext context) + throws Exception { + initializeFunction.accept(context); + } + }; } }; } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CompactorSinkITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CompactorSinkITCase.java index 42293ca2842e1..d487d75925eb9 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CompactorSinkITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/CompactorSinkITCase.java @@ -254,8 +254,8 @@ private OneInputStreamOperatorTestHarness createTestHarnes return harness; } - protected StoreCompactOperator createCompactOperator(FileStoreTable table) { - return new StoreCompactOperator( + protected StoreCompactOperator.Factory createCompactOperator(FileStoreTable table) { + return new StoreCompactOperator.Factory( table, (t, commitUser, state, ioManager, memoryPool, metricGroup) -> new StoreSinkWriteImpl( @@ -272,9 +272,9 @@ protected StoreCompactOperator createCompactOperator(FileStoreTable table) { true); } - protected MultiTablesStoreCompactOperator createMultiTablesCompactOperator( + protected MultiTablesStoreCompactOperator.Factory createMultiTablesCompactOperator( Catalog.Loader catalogLoader) throws Exception { - return new MultiTablesStoreCompactOperator( + return new MultiTablesStoreCompactOperator.Factory( catalogLoader, commitUser, new CheckpointConfig(), diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/FlinkSinkTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/FlinkSinkTest.java index c335568344b32..5f21858e61a58 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/FlinkSinkTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/FlinkSinkTest.java @@ -42,7 +42,7 @@ import org.apache.flink.streaming.api.datastream.DataStream; import org.apache.flink.streaming.api.datastream.DataStreamSource; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; -import org.apache.flink.streaming.api.operators.SimpleOperatorFactory; +import 
org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import org.apache.flink.streaming.api.transformations.OneInputTransformation; import org.apache.flink.streaming.util.OneInputStreamOperatorTestHarness; import org.junit.jupiter.api.Test; @@ -82,20 +82,22 @@ private boolean testSpillable( Collections.singletonList(GenericRow.of(1, 1))); FlinkSink flinkSink = new FixedBucketSink(fileStoreTable, null, null); DataStream written = flinkSink.doWrite(source, "123", 1); - RowDataStoreWriteOperator operator = - ((RowDataStoreWriteOperator) - ((SimpleOperatorFactory) - ((OneInputTransformation) written.getTransformation()) - .getOperatorFactory()) - .getOperator()); + OneInputStreamOperatorFactory operatorFactory = + (OneInputStreamOperatorFactory) + ((OneInputTransformation) + written.getTransformation()) + .getOperatorFactory(); TypeSerializer serializer = new CommittableTypeInfo().createSerializer(new ExecutionConfig()); OneInputStreamOperatorTestHarness harness = - new OneInputStreamOperatorTestHarness<>(operator); + new OneInputStreamOperatorTestHarness<>(operatorFactory); harness.setup(serializer); harness.initializeEmptyState(); + RowDataStoreWriteOperator operator = + (RowDataStoreWriteOperator) harness.getOneInputOperator(); + return ((KeyValueFileStoreWrite) ((StoreSinkWriteImpl) operator.write).write.getWrite()) .bufferSpillable(); } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/LocalMergeOperatorTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/LocalMergeOperatorTest.java index 1162e20b155b2..fc45eceb3fd5b 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/LocalMergeOperatorTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/LocalMergeOperatorTest.java @@ -26,12 +26,18 @@ import org.apache.paimon.types.RowKind; import org.apache.paimon.types.RowType; +import org.apache.flink.configuration.Configuration; +import org.apache.flink.runtime.operators.testutils.DummyEnvironment; import org.apache.flink.streaming.api.operators.Output; +import org.apache.flink.streaming.api.operators.StreamOperatorParameters; import org.apache.flink.streaming.api.watermark.Watermark; import org.apache.flink.streaming.runtime.streamrecord.LatencyMarker; import org.apache.flink.streaming.runtime.streamrecord.RecordAttributes; import org.apache.flink.streaming.runtime.streamrecord.StreamRecord; +import org.apache.flink.streaming.runtime.tasks.SourceOperatorStreamTask; import org.apache.flink.streaming.runtime.watermarkstatus.WatermarkStatus; +import org.apache.flink.streaming.util.MockOutput; +import org.apache.flink.streaming.util.MockStreamConfig; import org.apache.flink.util.OutputTag; import org.junit.jupiter.api.Test; @@ -151,7 +157,17 @@ private void prepareHashOperator(Map options) throws Exception { Collections.singletonList("f0"), options, null); - operator = new LocalMergeOperator(schema); + operator = + new LocalMergeOperator.Factory(schema) + .createStreamOperator( + new StreamOperatorParameters<>( + new SourceOperatorStreamTask( + new DummyEnvironment()), + new MockStreamConfig(new Configuration(), 1), + new MockOutput<>(new ArrayList<>()), + null, + null, + null)); operator.open(); assertThat(operator.merger()).isInstanceOf(HashMapLocalMerger.class); } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/StoreCompactOperatorTest.java 
b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/StoreCompactOperatorTest.java index f8387e1fc41a0..3740033e025e9 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/StoreCompactOperatorTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/StoreCompactOperatorTest.java @@ -48,8 +48,8 @@ public void testCompactExactlyOnce(boolean streamingMode) throws Exception { CompactRememberStoreWrite compactRememberStoreWrite = new CompactRememberStoreWrite(streamingMode); - StoreCompactOperator operator = - new StoreCompactOperator( + StoreCompactOperator.Factory operatorFactory = + new StoreCompactOperator.Factory( getTableDefault(), (table, commitUser, state, ioManager, memoryPool, metricGroup) -> compactRememberStoreWrite, @@ -59,7 +59,7 @@ public void testCompactExactlyOnce(boolean streamingMode) throws Exception { TypeSerializer serializer = new CommittableTypeInfo().createSerializer(new ExecutionConfig()); OneInputStreamOperatorTestHarness harness = - new OneInputStreamOperatorTestHarness<>(operator); + new OneInputStreamOperatorTestHarness<>(operatorFactory); harness.setup(serializer); harness.initializeEmptyState(); harness.open(); @@ -70,7 +70,7 @@ public void testCompactExactlyOnce(boolean streamingMode) throws Exception { harness.processElement(new StreamRecord<>(data(1))); harness.processElement(new StreamRecord<>(data(2))); - operator.prepareCommit(true, 1); + ((StoreCompactOperator) harness.getOneInputOperator()).prepareCommit(true, 1); Assertions.assertThat(compactRememberStoreWrite.compactTime).isEqualTo(3); } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/StoreMultiCommitterTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/StoreMultiCommitterTest.java index 10e432f3c8c21..752679fb59037 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/StoreMultiCommitterTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/StoreMultiCommitterTest.java @@ -645,11 +645,10 @@ public void testCommitMetrics() throws Exception { private OneInputStreamOperatorTestHarness createRecoverableTestHarness() throws Exception { - CommitterOperator operator = - new CommitterOperator<>( + CommitterOperatorFactory operator = + new CommitterOperatorFactory<>( true, false, - true, initialCommitUser, context -> new StoreMultiCommitter(catalogLoader, context), new RestoreAndFailCommittableStateManager<>( @@ -659,11 +658,10 @@ public void testCommitMetrics() throws Exception { private OneInputStreamOperatorTestHarness createLossyTestHarness() throws Exception { - CommitterOperator operator = - new CommitterOperator<>( + CommitterOperatorFactory operator = + new CommitterOperatorFactory<>( true, false, - true, initialCommitUser, context -> new StoreMultiCommitter(catalogLoader, context), new CommittableStateManager() { @@ -682,12 +680,13 @@ public void snapshotState( private OneInputStreamOperatorTestHarness createTestHarness( - CommitterOperator operator) + CommitterOperatorFactory + operatorFactory) throws Exception { TypeSerializer serializer = new MultiTableCommittableTypeInfo().createSerializer(new ExecutionConfig()); OneInputStreamOperatorTestHarness harness = - new OneInputStreamOperatorTestHarness<>(operator, serializer); + new OneInputStreamOperatorTestHarness<>(operatorFactory, serializer); harness.setup(serializer); return harness; } diff --git 
a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterChainingStrategyTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterChainingStrategyTest.java new file mode 100644 index 0000000000000..a4605b830918e --- /dev/null +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterChainingStrategyTest.java @@ -0,0 +1,203 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink.sink; + +import org.apache.flink.api.dag.Transformation; +import org.apache.flink.configuration.Configuration; +import org.apache.flink.runtime.jobgraph.JobVertex; +import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; +import org.apache.flink.table.api.CompiledPlan; +import org.apache.flink.table.api.bridge.java.StreamTableEnvironment; +import org.apache.flink.table.api.internal.CompiledPlanUtils; +import org.apache.flink.util.TimeUtils; +import org.junit.jupiter.api.BeforeEach; +import org.junit.jupiter.api.Test; +import org.junit.jupiter.api.io.TempDir; + +import java.time.Duration; +import java.util.ArrayList; +import java.util.HashMap; +import java.util.List; +import java.util.Map; +import java.util.stream.Collectors; + +import static org.assertj.core.api.Assertions.assertThat; + +/** + * Tests for {@link org.apache.flink.streaming.api.operators.ChainingStrategy} of writer operators. 
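+ * <p>Each case checks whether the writer vertex is chained with its upstream source and with its downstream committer for the given table configuration.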
+ */ +public class WriterChainingStrategyTest { + private static final String TABLE_NAME = "paimon_table"; + + @TempDir java.nio.file.Path tempDir; + + private StreamTableEnvironment tEnv; + + @BeforeEach + public void beforeEach() { + Configuration config = new Configuration(); + config.setString( + "execution.checkpointing.interval", + TimeUtils.formatWithHighestUnit(Duration.ofMillis(500))); + StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(config); + tEnv = StreamTableEnvironment.create(env); + + String catalog = "PAIMON"; + Map options = new HashMap<>(); + options.put("type", "paimon"); + options.put("warehouse", tempDir.toString()); + tEnv.executeSql( + String.format( + "CREATE CATALOG %s WITH ( %s )", + catalog, + options.entrySet().stream() + .map(e -> String.format("'%s'='%s'", e.getKey(), e.getValue())) + .collect(Collectors.joining(",")))); + tEnv.useCatalog(catalog); + } + + @Test + public void testAppendTable() throws Exception { + tEnv.executeSql( + String.format( + "CREATE TABLE %s (id INT, data STRING, dt STRING) " + + "WITH ('bucket' = '1', 'bucket-key'='id', 'write-only' = 'true')", + TABLE_NAME)) + .await(); + + verifyChaining(false, true); + } + + @Test + public void testAppendTableWithUnawareBucket() throws Exception { + tEnv.executeSql( + String.format( + "CREATE TABLE %s (id INT, data STRING, dt STRING) " + + "WITH ('bucket' = '-1', 'write-only' = 'true')", + TABLE_NAME)) + .await(); + + verifyChaining(true, true); + } + + @Test + public void testPrimaryKeyTable() throws Exception { + tEnv.executeSql( + String.format( + "CREATE TABLE %s (id INT, data STRING, dt STRING, PRIMARY KEY (id) NOT ENFORCED) " + + "WITH ('bucket' = '1', 'bucket-key'='id', 'write-only' = 'true')", + TABLE_NAME)) + .await(); + + verifyChaining(false, true); + } + + @Test + public void testPrimaryKeyTableWithDynamicBucket() throws Exception { + tEnv.executeSql( + String.format( + "CREATE TABLE %s (id INT, data STRING, dt STRING, PRIMARY KEY (id) NOT ENFORCED) " + + "WITH ('bucket' = '-1', 'write-only' = 'true')", + TABLE_NAME)) + .await(); + + verifyChaining(false, true); + } + + @Test + public void testPrimaryKeyTableWithMultipleWriter() throws Exception { + tEnv.executeSql( + String.format( + "CREATE TABLE %s (id INT, data STRING, dt STRING, PRIMARY KEY (id) NOT ENFORCED) " + + "WITH ('bucket' = '1', 'bucket-key'='id', 'write-only' = 'true', 'sink.parallelism' = '2')", + TABLE_NAME)) + .await(); + + verifyChaining(false, false); + } + + @Test + public void testPrimaryKeyTableWithCrossPartitionUpdate() throws Exception { + tEnv.executeSql( + String.format( + "CREATE TABLE %s (id INT, data STRING, dt STRING, PRIMARY KEY (id) NOT ENFORCED) " + + "PARTITIONED BY ( dt ) WITH ('bucket' = '-1', 'write-only' = 'true')", + TABLE_NAME)) + .await(); + + List vertices = verifyChaining(false, true); + JobVertex vertex = findVertex(vertices, "INDEX_BOOTSTRAP"); + assertThat(vertex.toString()).contains("Source"); + } + + @Test + public void testPrimaryKeyTableWithLocalMerge() throws Exception { + tEnv.executeSql( + String.format( + "CREATE TABLE %s (id INT, data STRING, dt STRING, PRIMARY KEY (id) NOT ENFORCED) " + + "WITH ('bucket' = '-1', 'write-only' = 'true', 'local-merge-buffer-size' = '1MB')", + TABLE_NAME)) + .await(); + + List vertices = verifyChaining(false, true); + JobVertex vertex = findVertex(vertices, "local merge"); + assertThat(vertex.toString()).contains("Source"); + } + + private List verifyChaining( + boolean isWriterChainedWithUpstream, boolean 
isWriterChainedWithDownStream) { + CompiledPlan plan = + tEnv.compilePlanSql( + String.format( + "INSERT INTO %s VALUES (1, 'AAA', ''), (2, 'BBB', '')", + TABLE_NAME)); + List> transformations = CompiledPlanUtils.toTransformations(tEnv, plan); + StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); + transformations.forEach(env::addOperator); + + List vertices = new ArrayList<>(); + env.getStreamGraph().getJobGraph().getVertices().forEach(vertices::add); + JobVertex vertex = findVertex(vertices, "Writer"); + + if (isWriterChainedWithUpstream) { + assertThat(vertex.toString()).contains("Source"); + } else { + assertThat(vertex.toString()).doesNotContain("Source"); + } + + if (isWriterChainedWithDownStream) { + assertThat(vertex.toString()).contains("Committer"); + } else { + assertThat(vertex.toString()).doesNotContain("Committer"); + } + + return vertices; + } + + private JobVertex findVertex(List vertices, String key) { + for (JobVertex vertex : vertices) { + if (vertex.toString().contains(key)) { + return vertex; + } + } + throw new IllegalStateException( + String.format( + "Cannot find vertex with keyword %s among job vertices %s", key, vertices)); + } +} diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterOperatorTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterOperatorTest.java index 3a8c1557122f7..83af157450780 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterOperatorTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterOperatorTest.java @@ -115,9 +115,10 @@ public void testAppendOnlyTableMetrics() throws Exception { private void testMetricsImpl(FileStoreTable fileStoreTable) throws Exception { String tableName = tablePath.getName(); - RowDataStoreWriteOperator operator = getStoreSinkWriteOperator(fileStoreTable); + RowDataStoreWriteOperator.Factory operatorFactory = + getStoreSinkWriteOperatorFactory(fileStoreTable); OneInputStreamOperatorTestHarness harness = - createHarness(operator); + createHarness(operatorFactory); TypeSerializer serializer = new CommittableTypeInfo().createSerializer(new ExecutionConfig()); @@ -133,7 +134,7 @@ private void testMetricsImpl(FileStoreTable fileStoreTable) throws Exception { harness.snapshot(1, 2); harness.notifyOfCompletedCheckpoint(1); - OperatorMetricGroup metricGroup = operator.getMetricGroup(); + OperatorMetricGroup metricGroup = harness.getOneInputOperator().getMetricGroup(); MetricGroup writerBufferMetricGroup = metricGroup .addGroup("paimon") @@ -173,9 +174,10 @@ public void testAsyncLookupWithFailure() throws Exception { rowType, Arrays.asList("pt", "k"), Collections.singletonList("k"), options); // we don't wait for compaction because this is async lookup test - RowDataStoreWriteOperator operator = getAsyncLookupWriteOperator(fileStoreTable, false); + RowDataStoreWriteOperator.Factory operatorFactory = + getAsyncLookupWriteOperatorFactory(fileStoreTable, false); OneInputStreamOperatorTestHarness harness = - createHarness(operator); + createHarness(operatorFactory); TableCommitImpl commit = fileStoreTable.newCommit(commitUser); @@ -205,8 +207,8 @@ public void testAsyncLookupWithFailure() throws Exception { harness.close(); // re-create operator from state, this time wait for compaction to check result - operator = getAsyncLookupWriteOperator(fileStoreTable, true); - harness = createHarness(operator); + operatorFactory = 
getAsyncLookupWriteOperatorFactory(fileStoreTable, true); + harness = createHarness(operatorFactory); harness.setup(serializer); harness.initializeState(state); harness.open(); @@ -263,9 +265,10 @@ private void testChangelog(boolean insertOnly) throws Exception { FileStoreTable fileStoreTable = createFileStoreTable( rowType, Arrays.asList("pt", "k"), Collections.singletonList("k"), options); - RowDataStoreWriteOperator operator = getStoreSinkWriteOperator(fileStoreTable); + RowDataStoreWriteOperator.Factory operatorFactory = + getStoreSinkWriteOperatorFactory(fileStoreTable); OneInputStreamOperatorTestHarness harness = - createHarness(operator); + createHarness(operatorFactory); TableCommitImpl commit = fileStoreTable.newCommit(commitUser); @@ -277,7 +280,7 @@ private void testChangelog(boolean insertOnly) throws Exception { if (insertOnly) { Field field = TableWriteOperator.class.getDeclaredField("write"); field.setAccessible(true); - StoreSinkWrite write = (StoreSinkWrite) field.get(operator); + StoreSinkWrite write = (StoreSinkWrite) field.get(harness.getOneInputOperator()); write.withInsertOnly(true); } @@ -339,17 +342,17 @@ public void testNumWritersMetric() throws Exception { options); TableCommitImpl commit = fileStoreTable.newCommit(commitUser); - RowDataStoreWriteOperator rowDataStoreWriteOperator = - getStoreSinkWriteOperator(fileStoreTable); + RowDataStoreWriteOperator.Factory operatorFactory = + getStoreSinkWriteOperatorFactory(fileStoreTable); OneInputStreamOperatorTestHarness harness = - createHarness(rowDataStoreWriteOperator); + createHarness(operatorFactory); TypeSerializer serializer = new CommittableTypeInfo().createSerializer(new ExecutionConfig()); harness.setup(serializer); harness.open(); - OperatorMetricGroup metricGroup = rowDataStoreWriteOperator.getMetricGroup(); + OperatorMetricGroup metricGroup = harness.getOneInputOperator().getMetricGroup(); MetricGroup writerBufferMetricGroup = metricGroup .addGroup("paimon") @@ -408,8 +411,9 @@ public void testNumWritersMetric() throws Exception { // Test utils // ------------------------------------------------------------------------ - private RowDataStoreWriteOperator getStoreSinkWriteOperator(FileStoreTable fileStoreTable) { - return new RowDataStoreWriteOperator( + private RowDataStoreWriteOperator.Factory getStoreSinkWriteOperatorFactory( + FileStoreTable fileStoreTable) { + return new RowDataStoreWriteOperator.Factory( fileStoreTable, null, (table, commitUser, state, ioManager, memoryPool, metricGroup) -> @@ -426,9 +430,9 @@ private RowDataStoreWriteOperator getStoreSinkWriteOperator(FileStoreTable fileS commitUser); } - private RowDataStoreWriteOperator getAsyncLookupWriteOperator( + private RowDataStoreWriteOperator.Factory getAsyncLookupWriteOperatorFactory( FileStoreTable fileStoreTable, boolean waitCompaction) { - return new RowDataStoreWriteOperator( + return new RowDataStoreWriteOperator.Factory( fileStoreTable, null, (table, commitUser, state, ioManager, memoryPool, metricGroup) -> @@ -471,10 +475,11 @@ private FileStoreTable createFileStoreTable( } private OneInputStreamOperatorTestHarness createHarness( - RowDataStoreWriteOperator operator) throws Exception { + RowDataStoreWriteOperator.Factory operatorFactory) throws Exception { InternalTypeInfo internalRowInternalTypeInfo = new InternalTypeInfo<>(new InternalRowTypeSerializer(RowType.builder().build())); return new OneInputStreamOperatorTestHarness<>( - operator, internalRowInternalTypeInfo.createSerializer(new ExecutionConfig())); + operatorFactory, + 
internalRowInternalTypeInfo.createSerializer(new ExecutionConfig())); } } From db37d46f835c4a591492409483b5027ea395ba64 Mon Sep 17 00:00:00 2001 From: herefree <841043203@qq.com> Date: Sun, 1 Dec 2024 19:39:28 +0800 Subject: [PATCH 084/157] [rest] change JsonProperty import path (#4609) --- .../java/org/apache/paimon/rest/responses/ConfigResponse.java | 2 +- .../java/org/apache/paimon/rest/responses/ErrorResponse.java | 2 +- .../src/test/java/org/apache/paimon/rest/MockRESTData.java | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/responses/ConfigResponse.java b/paimon-core/src/main/java/org/apache/paimon/rest/responses/ConfigResponse.java index e6bc934703642..903cfc84b46d8 100644 --- a/paimon-core/src/main/java/org/apache/paimon/rest/responses/ConfigResponse.java +++ b/paimon-core/src/main/java/org/apache/paimon/rest/responses/ConfigResponse.java @@ -21,11 +21,11 @@ import org.apache.paimon.rest.RESTResponse; import org.apache.paimon.utils.Preconditions; -import org.apache.paimon.shade.com.fasterxml.jackson.annotation.JsonProperty; import org.apache.paimon.shade.guava30.com.google.common.collect.ImmutableMap; import org.apache.paimon.shade.guava30.com.google.common.collect.Maps; import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonGetter; import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonIgnoreProperties; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonProperty; import java.beans.ConstructorProperties; import java.util.Map; diff --git a/paimon-core/src/main/java/org/apache/paimon/rest/responses/ErrorResponse.java b/paimon-core/src/main/java/org/apache/paimon/rest/responses/ErrorResponse.java index 0e4b234867329..685fe53071b66 100644 --- a/paimon-core/src/main/java/org/apache/paimon/rest/responses/ErrorResponse.java +++ b/paimon-core/src/main/java/org/apache/paimon/rest/responses/ErrorResponse.java @@ -18,8 +18,8 @@ package org.apache.paimon.rest.responses; -import org.apache.paimon.shade.com.fasterxml.jackson.annotation.JsonProperty; import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonGetter; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonProperty; import java.beans.ConstructorProperties; import java.io.PrintWriter; diff --git a/paimon-core/src/test/java/org/apache/paimon/rest/MockRESTData.java b/paimon-core/src/test/java/org/apache/paimon/rest/MockRESTData.java index 55c5165ada48e..9b7f1003e76fd 100644 --- a/paimon-core/src/test/java/org/apache/paimon/rest/MockRESTData.java +++ b/paimon-core/src/test/java/org/apache/paimon/rest/MockRESTData.java @@ -18,9 +18,9 @@ package org.apache.paimon.rest; -import org.apache.paimon.shade.com.fasterxml.jackson.annotation.JsonProperty; import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonGetter; import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonIgnoreProperties; +import org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonProperty; import java.beans.ConstructorProperties; From e72c06ce489e54272f02dbaa555a5c31d7c36c40 Mon Sep 17 00:00:00 2001 From: Steven <54518670+yangjf2019@users.noreply.github.com> Date: Sun, 1 Dec 2024 19:40:14 +0800 Subject: [PATCH 085/157] [doc] fix url links in documentation (#4610) --- docs/content/concepts/table-types.md | 2 +- docs/content/engines/doris.md | 4 ++-- docs/content/engines/starrocks.md | 2 +- docs/content/primary-key-table/overview.md | 2 +- 4 
files changed, 5 insertions(+), 5 deletions(-) diff --git a/docs/content/concepts/table-types.md b/docs/content/concepts/table-types.md index 58199031b6e7d..b5a1fafa3da1f 100644 --- a/docs/content/concepts/table-types.md +++ b/docs/content/concepts/table-types.md @@ -33,7 +33,7 @@ Paimon supports table types: 3. view: metastore required, views in SQL are a kind of virtual table 4. format-table: file format table refers to a directory that contains multiple files of the same format, where operations on this table allow for reading or writing to these files, compatible with Hive tables -5. object table: provides metadata indexes for unstructured data objects in the specified Object Storage storage directory. +5. object table: provides metadata indexes for unstructured data objects in the specified Object Storage directory. 6. materialized-table: aimed at simplifying both batch and stream data pipelines, providing a consistent development experience, see [Flink Materialized Table](https://nightlies.apache.org/flink/flink-docs-master/docs/dev/table/materialized-table/overview/) diff --git a/docs/content/engines/doris.md b/docs/content/engines/doris.md index cd778cd577979..6d22bc376a885 100644 --- a/docs/content/engines/doris.md +++ b/docs/content/engines/doris.md @@ -89,11 +89,11 @@ See [Apache Doris Website](https://doris.apache.org/docs/lakehouse/datalake-anal - Read optimized for Primary Key Table - Doris can utilize the [Read optimized](https://paimon.apache.org/releases/release-0.6/#read-optimized) feature for Primary Key Table(release in Paimon 0.6), by reading base data files using native Parquet/ORC reader and delta file using JNI. + Doris can utilize the [Read optimized](https://paimon.apache.org/docs/0.8/primary-key-table/read-optimized/) feature for Primary Key Table(release in Paimon 0.6), by reading base data files using native Parquet/ORC reader and delta file using JNI. - Deletion Vectors - Doris(2.1.4+) natively supports [Deletion Vectors](https://paimon.apache.org/releases/release-0.8/#deletion-vectors)(released in Paimon 0.8). + Doris(2.1.4+) natively supports [Deletion Vectors](https://paimon.apache.org/docs/0.8/primary-key-table/deletion-vectors/)(released in Paimon 0.8). ## Doris to Paimon type mapping diff --git a/docs/content/engines/starrocks.md b/docs/content/engines/starrocks.md index 1ab821a9a1033..dda22d35f76a3 100644 --- a/docs/content/engines/starrocks.md +++ b/docs/content/engines/starrocks.md @@ -81,7 +81,7 @@ SELECT * FROM paimon_catalog.test_db.partition_tbl$partitions; ## StarRocks to Paimon type mapping This section lists all supported type conversion between StarRocks and Paimon. -All StarRocks’s data types can be found in this doc [StarRocks Data type overview](https://docs.starrocks.io/docs/sql-reference/data-types/data-type-list/). +All StarRocks’s data types can be found in this doc [StarRocks Data type overview](https://docs.starrocks.io/docs/sql-reference/data-types/). diff --git a/docs/content/primary-key-table/overview.md b/docs/content/primary-key-table/overview.md index 508b990abc596..552d60eff6deb 100644 --- a/docs/content/primary-key-table/overview.md +++ b/docs/content/primary-key-table/overview.md @@ -56,6 +56,6 @@ Records within a data file are sorted by their primary keys. Within a sorted run {{< img src="/img/sorted-runs.png">}} -As you can see, different sorted runs may have overlapping primary key ranges, and may even contain the same primary key. 
When querying the LSM tree, all sorted runs must be combined and all records with the same primary key must be merged according to the user-specified [merge engine]({{< ref "primary-key-table/merge-engine" >}}) and the timestamp of each record. +As you can see, different sorted runs may have overlapping primary key ranges, and may even contain the same primary key. When querying the LSM tree, all sorted runs must be combined and all records with the same primary key must be merged according to the user-specified [merge engine]({{< ref "primary-key-table/merge-engine/overview" >}}) and the timestamp of each record. New records written into the LSM tree will be first buffered in memory. When the memory buffer is full, all records in memory will be sorted and flushed to disk. A new sorted run is now created. From 77b7d8d4dc11cdb5b4b86712faa1e8d37e30af86 Mon Sep 17 00:00:00 2001 From: tsreaper Date: Mon, 2 Dec 2024 15:41:03 +0800 Subject: [PATCH 086/157] [spark] Support changing column types in array or map (#4618) --- .../apache/paimon/schema/SchemaManager.java | 23 +- .../paimon/schema/SchemaManagerTest.java | 8 +- .../org/apache/paimon/flink/FlinkCatalog.java | 10 +- .../spark/SparkSchemaEvolutionITCase.java | 224 ++++++++++++++++++ 4 files changed, 253 insertions(+), 12 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java index d827ffd0fb66b..83ddbccfef987 100644 --- a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java +++ b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java @@ -639,9 +639,10 @@ public void updateIntermediateColumn(List newFields, int depth) String fullFieldName = String.join(".", Arrays.asList(updateFieldNames).subList(0, depth + 1)); - List nestedFields = - new ArrayList<>(extractRowType(field.type(), fullFieldName).getFields()); - updateIntermediateColumn(nestedFields, depth + 1); + List nestedFields = new ArrayList<>(); + int newDepth = + depth + extractRowDataFields(field.type(), fullFieldName, nestedFields); + updateIntermediateColumn(nestedFields, newDepth); newFields.set( i, new DataField( @@ -657,14 +658,22 @@ public void updateIntermediateColumn(List newFields, int depth) String.join(".", Arrays.asList(updateFieldNames).subList(0, depth + 1))); } - private RowType extractRowType(DataType type, String fullFieldName) { + private int extractRowDataFields( + DataType type, String fullFieldName, List nestedFields) { switch (type.getTypeRoot()) { case ROW: - return (RowType) type; + nestedFields.addAll(((RowType) type).getFields()); + return 1; case ARRAY: - return extractRowType(((ArrayType) type).getElementType(), fullFieldName); + return extractRowDataFields( + ((ArrayType) type).getElementType(), + fullFieldName, + nestedFields) + + 1; case MAP: - return extractRowType(((MapType) type).getValueType(), fullFieldName); + return extractRowDataFields( + ((MapType) type).getValueType(), fullFieldName, nestedFields) + + 1; default: throw new IllegalArgumentException( fullFieldName + " is not a structured type."); diff --git a/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java b/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java index f0d6543699659..c8b102b3584dc 100644 --- a/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/schema/SchemaManagerTest.java @@ -738,13 +738,15 @@ public void 
testUpdateRowTypeInArrayAndMap() throws Exception { SchemaChange addColumn = SchemaChange.addColumn( - new String[] {"v", "f3"}, + new String[] {"v", "element", "value", "f3"}, DataTypes.STRING(), null, SchemaChange.Move.first("f3")); - SchemaChange dropColumn = SchemaChange.dropColumn(new String[] {"v", "f2"}); + SchemaChange dropColumn = + SchemaChange.dropColumn(new String[] {"v", "element", "value", "f2"}); SchemaChange updateColumnType = - SchemaChange.updateColumnType(new String[] {"v", "f1"}, DataTypes.BIGINT(), false); + SchemaChange.updateColumnType( + new String[] {"v", "element", "value", "f1"}, DataTypes.BIGINT(), false); manager.commitChanges(addColumn, dropColumn, updateColumnType); innerType = diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java index 09fc0328ef655..c67e79c1c06b7 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java @@ -756,8 +756,11 @@ private void generateNestedColumnUpdates( "Column %s can only be updated to array type, and cannot be updated to %s type", joinedNames, newType); + List fullFieldNames = new ArrayList<>(fieldNames); + // add a dummy column name indicating the element of array + fullFieldNames.add("element"); generateNestedColumnUpdates( - fieldNames, + fullFieldNames, ((org.apache.paimon.types.ArrayType) oldType).getElementType(), ((org.apache.paimon.types.ArrayType) newType).getElementType(), schemaChanges); @@ -775,8 +778,11 @@ private void generateNestedColumnUpdates( joinedNames, oldMapType.getKeyType(), newMapType.getKeyType()); + List fullFieldNames = new ArrayList<>(fieldNames); + // add a dummy column name indicating the value of map + fullFieldNames.add("value"); generateNestedColumnUpdates( - fieldNames, + fullFieldNames, oldMapType.getValueType(), newMapType.getValueType(), schemaChanges); diff --git a/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkSchemaEvolutionITCase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkSchemaEvolutionITCase.java index 771ddc62878d1..fb4dab38ed940 100644 --- a/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkSchemaEvolutionITCase.java +++ b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkSchemaEvolutionITCase.java @@ -789,6 +789,89 @@ public void testAddAndDropNestedColumn(String formatType) { "[5,[53,[503,500.03,5003],five]]"); } + @ParameterizedTest() + @ValueSource(strings = {"orc", "avro", "parquet"}) + public void testAddAndDropNestedColumnInArray(String formatType) { + String tableName = "testAddNestedColumnTable"; + spark.sql( + "CREATE TABLE paimon.default." + + tableName + + " (k INT NOT NULL, v ARRAY>) " + + "TBLPROPERTIES ('bucket' = '1', 'primary-key' = 'k', 'file.format' = '" + + formatType + + "')"); + spark.sql( + "INSERT INTO paimon.default." + + tableName + + " VALUES (1, ARRAY(STRUCT('apple', 100), STRUCT('banana', 101))), " + + "(2, ARRAY(STRUCT('cat', 200), STRUCT('dog', 201)))"); + assertThat( + spark.sql("SELECT * FROM paimon.default." + tableName).collectAsList() + .stream() + .map(Row::toString)) + .containsExactlyInAnyOrder( + "[1,WrappedArray([apple,100], [banana,101])]", + "[2,WrappedArray([cat,200], [dog,201])]"); + + spark.sql( + "ALTER TABLE paimon.default." 
+ + tableName + + " ADD COLUMN v.element.f3 STRING AFTER f2"); + spark.sql("ALTER TABLE paimon.default." + tableName + " DROP COLUMN v.element.f1"); + spark.sql( + "INSERT INTO paimon.default." + + tableName + + " VALUES (1, ARRAY(STRUCT(110, 'APPLE'), STRUCT(111, 'BANANA'))), " + + "(3, ARRAY(STRUCT(310, 'FLOWER')))"); + assertThat( + spark.sql("SELECT * FROM paimon.default." + tableName).collectAsList() + .stream() + .map(Row::toString)) + .containsExactlyInAnyOrder( + "[1,WrappedArray([110,APPLE], [111,BANANA])]", + "[2,WrappedArray([200,null], [201,null])]", + "[3,WrappedArray([310,FLOWER])]"); + } + + @ParameterizedTest() + @ValueSource(strings = {"orc", "avro", "parquet"}) + public void testAddAndDropNestedColumnInMap(String formatType) { + String tableName = "testAddNestedColumnTable"; + spark.sql( + "CREATE TABLE paimon.default." + + tableName + + " (k INT NOT NULL, v MAP>) " + + "TBLPROPERTIES ('bucket' = '1', 'primary-key' = 'k', 'file.format' = '" + + formatType + + "')"); + spark.sql( + "INSERT INTO paimon.default." + + tableName + + " VALUES (1, MAP(10, STRUCT('apple', 100), 20, STRUCT('banana', 101))), " + + "(2, MAP(10, STRUCT('cat', 200), 20, STRUCT('dog', 201)))"); + assertThat( + spark.sql("SELECT k, v[10].f1, v[10].f2 FROM paimon.default." + tableName) + .collectAsList().stream() + .map(Row::toString)) + .containsExactlyInAnyOrder("[1,apple,100]", "[2,cat,200]"); + + spark.sql( + "ALTER TABLE paimon.default." + + tableName + + " ADD COLUMN v.value.f3 STRING AFTER f2"); + spark.sql("ALTER TABLE paimon.default." + tableName + " DROP COLUMN v.value.f1"); + spark.sql( + "INSERT INTO paimon.default." + + tableName + + " VALUES (1, MAP(10, STRUCT(110, 'APPLE'), 20, STRUCT(111, 'BANANA'))), " + + "(3, MAP(10, STRUCT(310, 'FLOWER')))"); + assertThat( + spark.sql("SELECT k, v[10].f2, v[10].f3 FROM paimon.default." + tableName) + .collectAsList().stream() + .map(Row::toString)) + .containsExactlyInAnyOrder("[1,110,APPLE]", "[2,200,null]", "[3,310,FLOWER]"); + } + @ParameterizedTest() @ValueSource(strings = {"orc", "avro", "parquet"}) public void testRenameNestedColumn(String formatType) { @@ -818,6 +901,67 @@ public void testRenameNestedColumn(String formatType) { .containsExactlyInAnyOrder("[apple,1]", "[banana,2]"); } + @ParameterizedTest() + @ValueSource(strings = {"orc", "avro", "parquet"}) + public void testRenameNestedColumnInArray(String formatType) { + String tableName = "testRenameNestedColumnTable"; + spark.sql( + "CREATE TABLE paimon.default." + + tableName + + " (k INT NOT NULL, v ARRAY>) " + + "TBLPROPERTIES ('file.format' = '" + + formatType + + "')"); + spark.sql( + "INSERT INTO paimon.default." + + tableName + + " VALUES (1, ARRAY(STRUCT('apple', 100), STRUCT('banana', 101))), " + + "(2, ARRAY(STRUCT('cat', 200), STRUCT('dog', 201)))"); + assertThat( + spark.sql("SELECT v[0].f1, k FROM paimon.default." + tableName) + .collectAsList().stream() + .map(Row::toString)) + .containsExactlyInAnyOrder("[apple,1]", "[cat,2]"); + + spark.sql( + "ALTER TABLE paimon.default." + tableName + " RENAME COLUMN v.element.f1 to f100"); + assertThat( + spark.sql("SELECT v[0].f100, k FROM paimon.default." + tableName) + .collectAsList().stream() + .map(Row::toString)) + .containsExactlyInAnyOrder("[apple,1]", "[cat,2]"); + } + + @ParameterizedTest() + @ValueSource(strings = {"orc", "avro", "parquet"}) + public void testRenameNestedColumnInMap(String formatType) { + String tableName = "testRenameNestedColumnTable"; + spark.sql( + "CREATE TABLE paimon.default." 
+ + tableName + + " (k INT NOT NULL, v MAP>) " + + "TBLPROPERTIES ('file.format' = '" + + formatType + + "')"); + spark.sql( + "INSERT INTO paimon.default." + + tableName + + " VALUES (1, MAP(10, STRUCT('apple', 100), 20, STRUCT('banana', 101))), " + + "(2, MAP(10, STRUCT('cat', 200), 20, STRUCT('dog', 201)))"); + assertThat( + spark.sql("SELECT v[10].f1, k FROM paimon.default." + tableName) + .collectAsList().stream() + .map(Row::toString)) + .containsExactlyInAnyOrder("[apple,1]", "[cat,2]"); + + spark.sql("ALTER TABLE paimon.default." + tableName + " RENAME COLUMN v.value.f1 to f100"); + assertThat( + spark.sql("SELECT v[10].f100, k FROM paimon.default." + tableName) + .collectAsList().stream() + .map(Row::toString)) + .containsExactlyInAnyOrder("[apple,1]", "[cat,2]"); + } + @ParameterizedTest() @ValueSource(strings = {"orc", "avro", "parquet"}) public void testUpdateNestedColumnType(String formatType) { @@ -850,4 +994,84 @@ public void testUpdateNestedColumnType(String formatType) { .map(Row::toString)) .containsExactlyInAnyOrder("[101,1]", "[200,2]", "[3000000000000,3]"); } + + @ParameterizedTest() + @ValueSource(strings = {"orc", "avro", "parquet"}) + public void testUpdateNestedColumnTypeInArray(String formatType) { + String tableName = "testRenameNestedColumnTable"; + spark.sql( + "CREATE TABLE paimon.default." + + tableName + + " (k INT NOT NULL, v ARRAY>) " + + "TBLPROPERTIES ('bucket' = '1', 'primary-key' = 'k', 'file.format' = '" + + formatType + + "')"); + spark.sql( + "INSERT INTO paimon.default." + + tableName + + " VALUES (1, ARRAY(STRUCT('apple', 100), STRUCT('banana', 101))), " + + "(2, ARRAY(STRUCT('cat', 200), STRUCT('dog', 201)))"); + assertThat( + spark.sql("SELECT * FROM paimon.default." + tableName).collectAsList() + .stream() + .map(Row::toString)) + .containsExactlyInAnyOrder( + "[1,WrappedArray([apple,100], [banana,101])]", + "[2,WrappedArray([cat,200], [dog,201])]"); + + spark.sql( + "ALTER TABLE paimon.default." + + tableName + + " CHANGE COLUMN v.element.f2 f2 BIGINT"); + spark.sql( + "INSERT INTO paimon.default." + + tableName + + " VALUES (1, ARRAY(STRUCT('APPLE', 1000000000000), STRUCT('BANANA', 111))), " + + "(3, ARRAY(STRUCT('FLOWER', 3000000000000)))"); + assertThat( + spark.sql("SELECT * FROM paimon.default." + tableName).collectAsList() + .stream() + .map(Row::toString)) + .containsExactlyInAnyOrder( + "[1,WrappedArray([APPLE,1000000000000], [BANANA,111])]", + "[2,WrappedArray([cat,200], [dog,201])]", + "[3,WrappedArray([FLOWER,3000000000000])]"); + } + + @ParameterizedTest() + @ValueSource(strings = {"orc", "avro", "parquet"}) + public void testUpdateNestedColumnTypeInMap(String formatType) { + String tableName = "testRenameNestedColumnTable"; + spark.sql( + "CREATE TABLE paimon.default." + + tableName + + " (k INT NOT NULL, v MAP>) " + + "TBLPROPERTIES ('bucket' = '1', 'primary-key' = 'k', 'file.format' = '" + + formatType + + "')"); + spark.sql( + "INSERT INTO paimon.default." + + tableName + + " VALUES (1, MAP(10, STRUCT('apple', 100), 20, STRUCT('banana', 101))), " + + "(2, MAP(10, STRUCT('cat', 200), 20, STRUCT('dog', 201)))"); + assertThat( + spark.sql("SELECT k, v[10].f1, v[10].f2 FROM paimon.default." + tableName) + .collectAsList().stream() + .map(Row::toString)) + .containsExactlyInAnyOrder("[1,apple,100]", "[2,cat,200]"); + + spark.sql( + "ALTER TABLE paimon.default." + tableName + " CHANGE COLUMN v.value.f2 f2 BIGINT"); + spark.sql( + "INSERT INTO paimon.default." 
+ + tableName + + " VALUES (1, MAP(10, STRUCT('APPLE', 1000000000000), 20, STRUCT('BANANA', 111))), " + + "(3, MAP(10, STRUCT('FLOWER', 3000000000000)))"); + assertThat( + spark.sql("SELECT k, v[10].f1, v[10].f2 FROM paimon.default." + tableName) + .collectAsList().stream() + .map(Row::toString)) + .containsExactlyInAnyOrder( + "[1,APPLE,1000000000000]", "[2,cat,200]", "[3,FLOWER,3000000000000]"); + } } From 6f967b4db5ca69d9ca530195bfc56e461b1719c6 Mon Sep 17 00:00:00 2001 From: Jingsong Lee Date: Mon, 2 Dec 2024 15:43:53 +0800 Subject: [PATCH 087/157] [core] Make metadata.stats-dense-store default value is true (#4617) --- docs/content/flink/sql-ddl.md | 4 +- .../generated/core_configuration.html | 4 +- .../java/org/apache/paimon/CoreOptions.java | 6 +-- .../apache/paimon/stats/StatsTableTest.java | 52 ++++++++++++++++++- .../table/AppendOnlyFileStoreTableTest.java | 1 - .../table/PrimaryKeyFileStoreTableTest.java | 2 - 6 files changed, 58 insertions(+), 11 deletions(-) diff --git a/docs/content/flink/sql-ddl.md b/docs/content/flink/sql-ddl.md index 0324e6655689a..8b8c069229aae 100644 --- a/docs/content/flink/sql-ddl.md +++ b/docs/content/flink/sql-ddl.md @@ -203,8 +203,8 @@ Paimon will automatically collect the statistics of the data file for speeding u The statistics collector mode can be configured by `'metadata.stats-mode'`, by default is `'truncate(16)'`. You can configure the field level by setting `'fields.{field_name}.stats-mode'`. -For the stats mode of `none`, we suggest that you configure `metadata.stats-dense-store` = `true`, which will -significantly reduce the storage size of the manifest. +For the stats mode of `none`, by default `metadata.stats-dense-store` is `true`, which will significantly reduce the +storage size of the manifest. But the Paimon sdk in reading engine requires at least version 0.9.1 or 1.0.0 or higher. 
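For illustration only (not part of this patch; the table and column names below are hypothetical), the statistics options discussed above are set in the table's WITH clause. A minimal Flink SQL sketch:

```sql
-- Hypothetical table: collect no per-column statistics except for item_id.
-- With 'metadata.stats-mode' = 'none', the dense store ('metadata.stats-dense-store',
-- now true by default) keeps the manifest entries compact.
CREATE TABLE orders (
    order_id BIGINT,
    item_id  BIGINT,
    dt       STRING,
    PRIMARY KEY (order_id, dt) NOT ENFORCED
) PARTITIONED BY (dt) WITH (
    'metadata.stats-mode' = 'none',
    'fields.item_id.stats-mode' = 'full'
);
```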
### Field Default Value diff --git a/docs/layouts/shortcodes/generated/core_configuration.html b/docs/layouts/shortcodes/generated/core_configuration.html index a38f07784fd38..fad1f4907e5a9 100644 --- a/docs/layouts/shortcodes/generated/core_configuration.html +++ b/docs/layouts/shortcodes/generated/core_configuration.html @@ -485,9 +485,9 @@ - + - + diff --git a/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java b/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java index fce09357f07ae..b9b5675f1d2d5 100644 --- a/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java +++ b/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java @@ -1101,7 +1101,7 @@ public class CoreOptions implements Serializable { public static final ConfigOption METADATA_STATS_DENSE_STORE = key("metadata.stats-dense-store") .booleanType() - .defaultValue(false) + .defaultValue(true) .withDescription( Description.builder() .text( @@ -1110,8 +1110,8 @@ public class CoreOptions implements Serializable { + " none statistic mode is set.") .linebreak() .text( - "Note, when this mode is enabled, the Paimon sdk in reading engine requires" - + " at least version 0.9.1 or 1.0.0 or higher.") + "Note, when this mode is enabled with 'metadata.stats-mode:none', the Paimon sdk in" + + " reading engine requires at least version 0.9.1 or 1.0.0 or higher.") .build()); public static final ConfigOption COMMIT_CALLBACKS = diff --git a/paimon-core/src/test/java/org/apache/paimon/stats/StatsTableTest.java b/paimon-core/src/test/java/org/apache/paimon/stats/StatsTableTest.java index 494b2e28e4593..25282d898a3dd 100644 --- a/paimon-core/src/test/java/org/apache/paimon/stats/StatsTableTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/stats/StatsTableTest.java @@ -35,6 +35,7 @@ import org.junit.jupiter.api.Test; +import static org.apache.paimon.CoreOptions.METADATA_STATS_DENSE_STORE; import static org.apache.paimon.CoreOptions.METADATA_STATS_MODE; import static org.assertj.core.api.Assertions.assertThat; @@ -42,10 +43,11 @@ public class StatsTableTest extends TableTestBase { @Test - public void testPartitionStats() throws Exception { + public void testPartitionStatsNotDense() throws Exception { Identifier identifier = identifier("T"); Options options = new Options(); options.set(METADATA_STATS_MODE, "NONE"); + options.set(METADATA_STATS_DENSE_STORE, false); options.set(CoreOptions.BUCKET, 1); Schema schema = Schema.newBuilder() @@ -90,4 +92,52 @@ public void testPartitionStats() throws Exception { assertThat(recordStats.maxValues().isNullAt(1)).isTrue(); assertThat(recordStats.maxValues().isNullAt(2)).isTrue(); } + + @Test + public void testPartitionStatsDenseMode() throws Exception { + Identifier identifier = identifier("T"); + Options options = new Options(); + options.set(METADATA_STATS_MODE, "NONE"); + options.set(CoreOptions.BUCKET, 1); + Schema schema = + Schema.newBuilder() + .column("pt", DataTypes.INT()) + .column("pk", DataTypes.INT()) + .column("col1", DataTypes.INT()) + .partitionKeys("pt") + .primaryKey("pk", "pt") + .options(options.toMap()) + .build(); + catalog.createTable(identifier, schema, true); + Table table = catalog.getTable(identifier); + + write( + table, + GenericRow.of(1, 1, 1), + GenericRow.of(1, 2, 1), + GenericRow.of(1, 3, 1), + GenericRow.of(2, 1, 1)); + + FileStoreTable storeTable = (FileStoreTable) table; + FileStore store = storeTable.store(); + String manifestListFile = storeTable.snapshotManager().latestSnapshot().deltaManifestList(); + + ManifestList manifestList 
= store.manifestListFactory().create(); + ManifestFileMeta manifest = manifestList.read(manifestListFile).get(0); + + // should have partition stats + SimpleStats partitionStats = manifest.partitionStats(); + assertThat(partitionStats.minValues().getInt(0)).isEqualTo(1); + assertThat(partitionStats.maxValues().getInt(0)).isEqualTo(2); + + // should not have record stats because of NONE mode + ManifestFile manifestFile = store.manifestFileFactory().create(); + DataFileMeta file = + manifestFile.read(manifest.fileName(), manifest.fileSize()).get(0).file(); + SimpleStats recordStats = file.valueStats(); + assertThat(file.valueStatsCols()).isEmpty(); + assertThat(recordStats.minValues().getFieldCount()).isEqualTo(0); + assertThat(recordStats.maxValues().getFieldCount()).isEqualTo(0); + assertThat(recordStats.nullCounts().size()).isEqualTo(0); + } } diff --git a/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java b/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java index 0328cc6bada34..922221bb8dc99 100644 --- a/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java @@ -230,7 +230,6 @@ public void testBatchProjection() throws Exception { public void testBatchFilter(boolean statsDenseStore) throws Exception { Consumer optionsSetter = options -> { - options.set(CoreOptions.METADATA_STATS_DENSE_STORE, statsDenseStore); if (statsDenseStore) { options.set(CoreOptions.METADATA_STATS_MODE, "none"); options.set("fields.b.stats-mode", "full"); diff --git a/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java b/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java index 51c8b328dfc6a..46b85223bc2fa 100644 --- a/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java @@ -348,7 +348,6 @@ public void testBatchProjection() throws Exception { public void testBatchFilter(boolean statsDenseStore) throws Exception { Consumer optionsSetter = options -> { - options.set(CoreOptions.METADATA_STATS_DENSE_STORE, statsDenseStore); if (statsDenseStore) { // pk table doesn't need value stats options.set(CoreOptions.METADATA_STATS_MODE, "none"); @@ -1664,7 +1663,6 @@ public void testReadDeletionVectorTable(boolean statsDenseStore) throws Exceptio options.set(TARGET_FILE_SIZE, new MemorySize(1)); options.set(DELETION_VECTORS_ENABLED, true); - options.set(CoreOptions.METADATA_STATS_DENSE_STORE, statsDenseStore); if (statsDenseStore) { options.set(CoreOptions.METADATA_STATS_MODE, "none"); options.set("fields.b.stats-mode", "full"); From 39b82ec160414f7ca2cdafed0fc453f3fc7a7529 Mon Sep 17 00:00:00 2001 From: yunfengzhou-hub Date: Mon, 2 Dec 2024 15:46:40 +0800 Subject: [PATCH 088/157] [flink] Replace legacy SinkFunction with v2 Sink (#4612) --- .../connector/sink2/WriterInitContext.java | 22 +++++ .../api/functions/sink/v2/DiscardingSink.java | 58 +++++++++++++ .../connector/sink2/WriterInitContext.java | 22 +++++ .../api/functions/sink/v2/DiscardingSink.java | 58 +++++++++++++ .../connector/sink2/WriterInitContext.java | 25 ++++++ .../api/functions/sink/v2/DiscardingSink.java | 59 +++++++++++++ .../connector/sink2/WriterInitContext.java | 22 +++++ .../api/functions/sink/v2/DiscardingSink.java | 59 +++++++++++++ .../sink/cdc/FlinkCdcMultiTableSink.java | 4 +- 
.../sink/cdc/FlinkCdcMultiTableSinkTest.java | 5 +- .../paimon/flink/action/CloneAction.java | 4 +- .../flink/service/QueryAddressRegister.java | 84 +++++++++++-------- .../paimon/flink/service/QueryService.java | 2 +- .../sink/CombinedTableCompactorSink.java | 4 +- .../apache/paimon/flink/sink/FlinkSink.java | 4 +- .../sink/WriterChainingStrategyTest.java | 2 +- 16 files changed, 384 insertions(+), 50 deletions(-) create mode 100644 paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java create mode 100644 paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java create mode 100644 paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java create mode 100644 paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java create mode 100644 paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java create mode 100644 paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java create mode 100644 paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java create mode 100644 paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java diff --git a/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java new file mode 100644 index 0000000000000..563dbbe75e7e6 --- /dev/null +++ b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.connector.sink2; + +/** Placeholder class to resolve compatibility issues. */ +public interface WriterInitContext extends org.apache.flink.api.connector.sink2.Sink.InitContext {} diff --git a/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java new file mode 100644 index 0000000000000..98aaf6418ff7f --- /dev/null +++ b/paimon-flink/paimon-flink-1.15/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java @@ -0,0 +1,58 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. 
See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.streaming.api.functions.sink.v2; + +import org.apache.flink.annotation.PublicEvolving; +import org.apache.flink.api.connector.sink2.Sink; +import org.apache.flink.api.connector.sink2.SinkWriter; + +import java.io.IOException; + +/** + * A special sink that ignores all elements. + * + * @param The type of elements received by the sink. + */ +@PublicEvolving +public class DiscardingSink implements Sink { + private static final long serialVersionUID = 1L; + + @Override + public SinkWriter createWriter(InitContext context) throws IOException { + return new DiscardingElementWriter(); + } + + private class DiscardingElementWriter implements SinkWriter { + + @Override + public void write(IN element, Context context) throws IOException, InterruptedException { + // discard it. + } + + @Override + public void flush(boolean endOfInput) throws IOException, InterruptedException { + // this writer has no pending data. + } + + @Override + public void close() throws Exception { + // do nothing. + } + } +} diff --git a/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java new file mode 100644 index 0000000000000..563dbbe75e7e6 --- /dev/null +++ b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.connector.sink2; + +/** Placeholder class to resolve compatibility issues. 
*/ +public interface WriterInitContext extends org.apache.flink.api.connector.sink2.Sink.InitContext {} diff --git a/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java new file mode 100644 index 0000000000000..98aaf6418ff7f --- /dev/null +++ b/paimon-flink/paimon-flink-1.16/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java @@ -0,0 +1,58 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.streaming.api.functions.sink.v2; + +import org.apache.flink.annotation.PublicEvolving; +import org.apache.flink.api.connector.sink2.Sink; +import org.apache.flink.api.connector.sink2.SinkWriter; + +import java.io.IOException; + +/** + * A special sink that ignores all elements. + * + * @param The type of elements received by the sink. + */ +@PublicEvolving +public class DiscardingSink implements Sink { + private static final long serialVersionUID = 1L; + + @Override + public SinkWriter createWriter(InitContext context) throws IOException { + return new DiscardingElementWriter(); + } + + private class DiscardingElementWriter implements SinkWriter { + + @Override + public void write(IN element, Context context) throws IOException, InterruptedException { + // discard it. + } + + @Override + public void flush(boolean endOfInput) throws IOException, InterruptedException { + // this writer has no pending data. + } + + @Override + public void close() throws Exception { + // do nothing. + } + } +} diff --git a/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java new file mode 100644 index 0000000000000..db45000425723 --- /dev/null +++ b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java @@ -0,0 +1,25 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+ * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.connector.sink2; + +import org.apache.flink.annotation.Public; + +/** Placeholder class to resolve compatibility issues. */ +@Public +public interface WriterInitContext extends org.apache.flink.api.connector.sink2.Sink.InitContext {} diff --git a/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java new file mode 100644 index 0000000000000..fc7eb0d483569 --- /dev/null +++ b/paimon-flink/paimon-flink-1.17/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java @@ -0,0 +1,59 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.streaming.api.functions.sink.v2; + +import org.apache.flink.annotation.PublicEvolving; +import org.apache.flink.api.common.SupportsConcurrentExecutionAttempts; +import org.apache.flink.api.connector.sink2.Sink; +import org.apache.flink.api.connector.sink2.SinkWriter; + +import java.io.IOException; + +/** + * A special sink that ignores all elements. + * + * @param The type of elements received by the sink. + */ +@PublicEvolving +public class DiscardingSink implements Sink, SupportsConcurrentExecutionAttempts { + private static final long serialVersionUID = 1L; + + @Override + public SinkWriter createWriter(InitContext context) throws IOException { + return new DiscardingElementWriter(); + } + + private class DiscardingElementWriter implements SinkWriter { + + @Override + public void write(IN element, Context context) throws IOException, InterruptedException { + // discard it. + } + + @Override + public void flush(boolean endOfInput) throws IOException, InterruptedException { + // this writer has no pending data. + } + + @Override + public void close() throws Exception { + // do nothing. + } + } +} diff --git a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java new file mode 100644 index 0000000000000..563dbbe75e7e6 --- /dev/null +++ b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/api/connector/sink2/WriterInitContext.java @@ -0,0 +1,22 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. 
The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.api.connector.sink2; + +/** Placeholder class to resolve compatibility issues. */ +public interface WriterInitContext extends org.apache.flink.api.connector.sink2.Sink.InitContext {} diff --git a/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java new file mode 100644 index 0000000000000..fc7eb0d483569 --- /dev/null +++ b/paimon-flink/paimon-flink-1.18/src/main/java/org/apache/flink/streaming/api/functions/sink/v2/DiscardingSink.java @@ -0,0 +1,59 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.flink.streaming.api.functions.sink.v2; + +import org.apache.flink.annotation.PublicEvolving; +import org.apache.flink.api.common.SupportsConcurrentExecutionAttempts; +import org.apache.flink.api.connector.sink2.Sink; +import org.apache.flink.api.connector.sink2.SinkWriter; + +import java.io.IOException; + +/** + * A special sink that ignores all elements. + * + * @param The type of elements received by the sink. + */ +@PublicEvolving +public class DiscardingSink implements Sink, SupportsConcurrentExecutionAttempts { + private static final long serialVersionUID = 1L; + + @Override + public SinkWriter createWriter(InitContext context) throws IOException { + return new DiscardingElementWriter(); + } + + private class DiscardingElementWriter implements SinkWriter { + + @Override + public void write(IN element, Context context) throws IOException, InterruptedException { + // discard it. + } + + @Override + public void flush(boolean endOfInput) throws IOException, InterruptedException { + // this writer has no pending data. + } + + @Override + public void close() throws Exception { + // do nothing. 
+ } + } +} diff --git a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSink.java b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSink.java index f9b7bbc6b9105..1688d4deb0884 100644 --- a/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSink.java +++ b/paimon-flink/paimon-flink-cdc/src/main/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSink.java @@ -40,7 +40,7 @@ import org.apache.flink.streaming.api.datastream.DataStreamSink; import org.apache.flink.streaming.api.datastream.SingleOutputStreamOperator; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; -import org.apache.flink.streaming.api.functions.sink.DiscardingSink; +import org.apache.flink.streaming.api.functions.sink.v2.DiscardingSink; import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import javax.annotation.Nullable; @@ -134,7 +134,7 @@ public DataStreamSink sinkFrom( createCommittableStateManager())) .setParallelism(input.getParallelism()); configureGlobalCommitter(committed, commitCpuCores, commitHeapMemory); - return committed.addSink(new DiscardingSink<>()).name("end").setParallelism(1); + return committed.sinkTo(new DiscardingSink<>()).name("end").setParallelism(1); } protected OneInputStreamOperatorFactory diff --git a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSinkTest.java b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSinkTest.java index e1bd112ca751e..723f57a30e3f7 100644 --- a/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSinkTest.java +++ b/paimon-flink/paimon-flink-cdc/src/test/java/org/apache/paimon/flink/sink/cdc/FlinkCdcMultiTableSinkTest.java @@ -22,11 +22,11 @@ import org.apache.paimon.flink.FlinkConnectorOptions; import org.apache.paimon.options.Options; +import org.apache.flink.api.dag.Transformation; import org.apache.flink.streaming.api.datastream.DataStreamSink; import org.apache.flink.streaming.api.datastream.DataStreamSource; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; import org.apache.flink.streaming.api.functions.source.ParallelSourceFunction; -import org.apache.flink.streaming.api.transformations.LegacySinkTransformation; import org.apache.flink.streaming.api.transformations.OneInputTransformation; import org.apache.flink.streaming.api.transformations.PartitionTransformation; import org.junit.jupiter.api.Test; @@ -64,8 +64,7 @@ public void cancel() {} DataStreamSink dataStreamSink = sink.sinkFrom(input); // check the transformation graph - LegacySinkTransformation end = - (LegacySinkTransformation) dataStreamSink.getTransformation(); + Transformation end = dataStreamSink.getTransformation(); assertThat(end.getName()).isEqualTo("end"); OneInputTransformation committer = diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CloneAction.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CloneAction.java index 2f90147eeb2a3..bac030dd04966 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CloneAction.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/action/CloneAction.java @@ -32,7 +32,7 @@ import org.apache.flink.streaming.api.datastream.DataStream; import 
org.apache.flink.streaming.api.datastream.SingleOutputStreamOperator; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; -import org.apache.flink.streaming.api.functions.sink.DiscardingSink; +import org.apache.flink.streaming.api.functions.sink.v2.DiscardingSink; import java.util.HashMap; import java.util.Map; @@ -141,7 +141,7 @@ copyFiles, new SnapshotHintChannelComputer(), parallelism) new SnapshotHintOperator(targetCatalogConfig)) .setParallelism(parallelism); - snapshotHintOperator.addSink(new DiscardingSink<>()).name("end").setParallelism(1); + snapshotHintOperator.sinkTo(new DiscardingSink<>()).name("end").setParallelism(1); } @Override diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryAddressRegister.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryAddressRegister.java index 524f2e5f01c17..00d527506cfef 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryAddressRegister.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryAddressRegister.java @@ -23,10 +23,9 @@ import org.apache.paimon.table.FileStoreTable; import org.apache.paimon.table.Table; -import org.apache.flink.api.common.functions.OpenContext; -import org.apache.flink.configuration.Configuration; -import org.apache.flink.streaming.api.functions.sink.RichSinkFunction; -import org.apache.flink.streaming.api.functions.sink.SinkFunction; +import org.apache.flink.api.connector.sink2.Sink; +import org.apache.flink.api.connector.sink2.SinkWriter; +import org.apache.flink.api.connector.sink2.WriterInitContext; import java.net.InetSocketAddress; import java.util.TreeMap; @@ -34,57 +33,68 @@ import static org.apache.paimon.service.ServiceManager.PRIMARY_KEY_LOOKUP; /** Operator for address server to register addresses to {@link ServiceManager}. */ -public class QueryAddressRegister extends RichSinkFunction { - +public class QueryAddressRegister implements Sink { private final ServiceManager serviceManager; - private transient int numberExecutors; - private transient TreeMap executors; - public QueryAddressRegister(Table table) { this.serviceManager = ((FileStoreTable) table).store().newServiceManager(); } /** - * Do not annotate with @override here to maintain compatibility with Flink 1.18-. + * Do not annotate with @override here to maintain compatibility with Flink 2.0+. */ - public void open(OpenContext openContext) throws Exception { - open(new Configuration()); + public SinkWriter createWriter(InitContext context) { + return new QueryAddressRegisterSinkWriter(serviceManager); } /** - * Do not annotate with @override here to maintain compatibility with Flink 2.0+. + * Do not annotate with @override here to maintain compatibility with Flink 1.18-. */ - public void open(Configuration parameters) throws Exception { - this.executors = new TreeMap<>(); + public SinkWriter createWriter(WriterInitContext context) { + return new QueryAddressRegisterSinkWriter(serviceManager); } - @Override - public void invoke(InternalRow row, SinkFunction.Context context) { - int numberExecutors = row.getInt(0); - if (this.numberExecutors != 0 && this.numberExecutors != numberExecutors) { - throw new IllegalArgumentException( - String.format( - "Number Executors can not be changed! 
Old %s , New %s .", - this.numberExecutors, numberExecutors)); - } - this.numberExecutors = numberExecutors; + private static class QueryAddressRegisterSinkWriter implements SinkWriter { + private final ServiceManager serviceManager; - int executorId = row.getInt(1); - String hostname = row.getString(2).toString(); - int port = row.getInt(3); + private final TreeMap executors; - executors.put(executorId, new InetSocketAddress(hostname, port)); + private int numberExecutors; - if (executors.size() == numberExecutors) { - serviceManager.resetService( - PRIMARY_KEY_LOOKUP, executors.values().toArray(new InetSocketAddress[0])); + private QueryAddressRegisterSinkWriter(ServiceManager serviceManager) { + this.serviceManager = serviceManager; + this.executors = new TreeMap<>(); } - } - @Override - public void close() throws Exception { - super.close(); - serviceManager.deleteService(PRIMARY_KEY_LOOKUP); + @Override + public void write(InternalRow row, Context context) { + int numberExecutors = row.getInt(0); + if (this.numberExecutors != 0 && this.numberExecutors != numberExecutors) { + throw new IllegalArgumentException( + String.format( + "Number Executors can not be changed! Old %s , New %s .", + this.numberExecutors, numberExecutors)); + } + this.numberExecutors = numberExecutors; + + int executorId = row.getInt(1); + String hostname = row.getString(2).toString(); + int port = row.getInt(3); + + executors.put(executorId, new InetSocketAddress(hostname, port)); + + if (executors.size() == numberExecutors) { + serviceManager.resetService( + PRIMARY_KEY_LOOKUP, executors.values().toArray(new InetSocketAddress[0])); + } + } + + @Override + public void flush(boolean endOfInput) {} + + @Override + public void close() { + serviceManager.deleteService(PRIMARY_KEY_LOOKUP); + } } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryService.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryService.java index bd433fe0f00d0..752d54cff5a0f 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryService.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/service/QueryService.java @@ -62,7 +62,7 @@ public static void build(StreamExecutionEnvironment env, Table table, int parall InternalTypeInfo.fromRowType(QueryExecutorOperator.outputType()), executorOperator) .setParallelism(parallelism) - .addSink(new QueryAddressRegister(table)) + .sinkTo(new QueryAddressRegister(table)) .setParallelism(1); sink.getTransformation().setMaxParallelism(1); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java index c2b4cc0f87e60..25f76ce976833 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/CombinedTableCompactorSink.java @@ -32,7 +32,7 @@ import org.apache.flink.streaming.api.datastream.SingleOutputStreamOperator; import org.apache.flink.streaming.api.environment.CheckpointConfig; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; -import org.apache.flink.streaming.api.functions.sink.DiscardingSink; +import org.apache.flink.streaming.api.functions.sink.v2.DiscardingSink; import 
org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import org.apache.flink.table.data.RowData; @@ -171,7 +171,7 @@ protected DataStreamSink doCommit( if (!options.get(SINK_COMMITTER_OPERATOR_CHAINING)) { committed = committed.startNewChain(); } - return committed.addSink(new DiscardingSink<>()).name("end").setParallelism(1); + return committed.sinkTo(new DiscardingSink<>()).name("end").setParallelism(1); } // TODO:refactor FlinkSink to adopt this sink diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java index 8d6c3554c76ff..002f5887b5f08 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/FlinkSink.java @@ -43,7 +43,7 @@ import org.apache.flink.streaming.api.datastream.SingleOutputStreamOperator; import org.apache.flink.streaming.api.environment.CheckpointConfig; import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment; -import org.apache.flink.streaming.api.functions.sink.DiscardingSink; +import org.apache.flink.streaming.api.functions.sink.v2.DiscardingSink; import org.apache.flink.streaming.api.operators.OneInputStreamOperatorFactory; import org.apache.flink.table.api.config.ExecutionConfigOptions; @@ -316,7 +316,7 @@ protected DataStreamSink doCommit(DataStream written, String com } configureGlobalCommitter( committed, options.get(SINK_COMMITTER_CPU), options.get(SINK_COMMITTER_MEMORY)); - return committed.addSink(new DiscardingSink<>()).name("end").setParallelism(1); + return committed.sinkTo(new DiscardingSink<>()).name("end").setParallelism(1); } public static void configureGlobalCommitter( diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterChainingStrategyTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterChainingStrategyTest.java index a4605b830918e..24fb529b59ea2 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterChainingStrategyTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/WriterChainingStrategyTest.java @@ -173,7 +173,7 @@ private List verifyChaining( List vertices = new ArrayList<>(); env.getStreamGraph().getJobGraph().getVertices().forEach(vertices::add); - JobVertex vertex = findVertex(vertices, "Writer"); + JobVertex vertex = findVertex(vertices, "Writer(write-only)"); if (isWriterChainedWithUpstream) { assertThat(vertex.toString()).contains("Source"); From 271de7deac24b5ecc6306d345dcb5607d9f4a35a Mon Sep 17 00:00:00 2001 From: tsreaper Date: Mon, 2 Dec 2024 15:59:39 +0800 Subject: [PATCH 089/157] [docs] Add document for nested column evolution (#4619) --- docs/content/flink/sql-alter.md | 16 +++++++ docs/content/spark/sql-alter.md | 84 +++++++++++++++++++++++++++++++++ 2 files changed, 100 insertions(+) diff --git a/docs/content/flink/sql-alter.md b/docs/content/flink/sql-alter.md index bee616f047d42..877995cc631bb 100644 --- a/docs/content/flink/sql-alter.md +++ b/docs/content/flink/sql-alter.md @@ -78,6 +78,10 @@ If you use object storage, such as S3 or OSS, please use this syntax carefully, The following SQL adds two columns `c1` and `c2` to table `my_table`. +{{< hint info >}} +To add a column in a row type, see [Changing Column Type](#changing-column-type). 
+{{< /hint >}} + ```sql ALTER TABLE my_table ADD (c1 INT, c2 STRING); ``` @@ -99,6 +103,10 @@ otherwise this operation may fail, throws an exception like `The following colum ALTER TABLE my_table DROP (c1, c2); ``` +{{< hint info >}} +To drop a column in a row type, see [Changing Column Type](#changing-column-type). +{{< /hint >}} + ## Dropping Partitions The following SQL drops the partitions of the paimon table. @@ -185,6 +193,14 @@ The following SQL changes type of column `col_a` to `DOUBLE`. ALTER TABLE my_table MODIFY col_a DOUBLE; ``` +Paimon also supports changing columns of row type, array type, and map type. + +```sql +-- col_a previously has type ARRAY> +-- the following SQL changes f1 to BIGINT, drops f2, and adds f3 +ALTER TABLE my_table MODIFY col_a ARRAY>; +``` + ## Adding watermark The following SQL adds a computed column `ts` from existing column `log_ts`, and a watermark with strategy `ts - INTERVAL '1' HOUR` on column `ts` which is marked as event time attribute of table `my_table`. diff --git a/docs/content/spark/sql-alter.md b/docs/content/spark/sql-alter.md index 11af186e62131..3ad72048029b0 100644 --- a/docs/content/spark/sql-alter.md +++ b/docs/content/spark/sql-alter.md @@ -95,6 +95,27 @@ ALTER TABLE my_table ADD COLUMNS ( ); ``` +The following SQL adds a nested column `f3` to a struct type. + +```sql +-- column v previously has type STRUCT +ALTER TABLE my_table ADD COLUMN v.f3 STRING; +``` + +The following SQL adds a nested column `f3` to a struct type, which is the element type of an array type. + +```sql +-- column v previously has type ARRAY> +ALTER TABLE my_table ADD COLUMN v.element.f3 STRING; +``` + +The following SQL adds a nested column `f3` to a struct type, which is the value type of a map type. + +```sql +-- column v previously has type MAP> +ALTER TABLE my_table ADD COLUMN v.value.f3 STRING; +``` + ## Renaming Column Name The following SQL renames column `c0` in table `my_table` to `c1`. @@ -103,6 +124,27 @@ The following SQL renames column `c0` in table `my_table` to `c1`. ALTER TABLE my_table RENAME COLUMN c0 TO c1; ``` +The following SQL renames a nested column `f1` to `f100` in a struct type. + +```sql +-- column v previously has type STRUCT +ALTER TABLE my_table RENAME COLUMN v.f1 to f100; +``` + +The following SQL renames a nested column `f1` to `f100` in a struct type, which is the element type of an array type. + +```sql +-- column v previously has type ARRAY> +ALTER TABLE my_table RENAME COLUMN v.element.f1 to f100; +``` + +The following SQL renames a nested column `f1` to `f100` in a struct type, which is the value type of a map type. + +```sql +-- column v previously has type MAP> +ALTER TABLE my_table RENAME COLUMN v.value.f1 to f100; +``` + ## Dropping Columns The following SQL drops two columns `c1` and `c2` from table `my_table`. @@ -111,6 +153,27 @@ The following SQL drops two columns `c1` and `c2` from table `my_table`. ALTER TABLE my_table DROP COLUMNS (c1, c2); ``` +The following SQL drops a nested column `f2` from a struct type. + +```sql +-- column v previously has type STRUCT +ALTER TABLE my_table DROP COLUMN v.f2; +``` + +The following SQL drops a nested column `f2` from a struct type, which is the element type of an array type. + +```sql +-- column v previously has type ARRAY> +ALTER TABLE my_table DROP COLUMN v.element.f2; +``` + +The following SQL drops a nested column `f2` from a struct type, which is the value type of a map type. 
+ +```sql +-- column v previously has type MAP> +ALTER TABLE my_table DROP COLUMN v.value.f2; +``` + ## Dropping Partitions The following SQL drops the partitions of the paimon table. For spark sql, you need to specify all the partition columns. @@ -156,3 +219,24 @@ ALTER TABLE my_table ALTER COLUMN col_a AFTER col_b; ```sql ALTER TABLE my_table ALTER COLUMN col_a TYPE DOUBLE; ``` + +The following SQL changes the type of a nested column `f2` to `BIGINT` in a struct type. + +```sql +-- column v previously has type STRUCT +ALTER TABLE my_table ALTER COLUMN v.f2 TYPE BIGINT; +``` + +The following SQL changes the type of a nested column `f2` to `BIGINT` in a struct type, which is the element type of an array type. + +```sql +-- column v previously has type ARRAY> +ALTER TABLE my_table ALTER COLUMN v.element.f2 TYPE BIGINT; +``` + +The following SQL changes the type of a nested column `f2` to `BIGINT` in a struct type, which is the value type of a map type. + +```sql +-- column v previously has type MAP> +ALTER TABLE my_table ALTER COLUMN v.value.f2 TYPE BIGINT; +``` From 4e1b74976590fbe5d885614b65e038217c9266df Mon Sep 17 00:00:00 2001 From: Jingsong Lee Date: Mon, 2 Dec 2024 18:13:33 +0800 Subject: [PATCH 090/157] [iceberg] Use gzip by default to iceberg avro writer (#4620) --- docs/content/migration/iceberg-compatibility.md | 6 ++++++ .../org/apache/paimon/iceberg/IcebergOptions.java | 7 +++++++ .../iceberg/manifest/IcebergManifestFile.java | 15 +++++++++++---- .../iceberg/manifest/IcebergManifestList.java | 15 +++++++++++---- .../paimon/iceberg/IcebergCompatibilityTest.java | 6 ++++++ 5 files changed, 41 insertions(+), 8 deletions(-) diff --git a/docs/content/migration/iceberg-compatibility.md b/docs/content/migration/iceberg-compatibility.md index f07f78cb201df..7b83936b53208 100644 --- a/docs/content/migration/iceberg-compatibility.md +++ b/docs/content/migration/iceberg-compatibility.md @@ -371,6 +371,12 @@ you also need to set some (or all) of the following table options when creating + + + + + +
    metadata.stats-dense-store
    falsetrue BooleanWhether to store statistic densely in metadata (manifest files), which will significantly reduce the storage size of metadata when the none statistic mode is set.
    Note, when this mode is enabled, the Paimon sdk in reading engine requires at least version 0.9.1 or 1.0.0 or higher.
    Whether to store statistic densely in metadata (manifest files), which will significantly reduce the storage size of metadata when the none statistic mode is set.
    Note, when this mode is enabled with 'metadata.stats-mode:none', the Paimon sdk in reading engine requires at least version 0.9.1 or 1.0.0 or higher.
    metadata.stats-mode
    String hadoop-conf-dir for Iceberg Hive catalog.
    metadata.iceberg.manifest-compression
    gzip
    String
    Compression for Iceberg manifest files.
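For context, a minimal sketch of how the option added in this patch could be applied from Flink SQL. The catalog, database and table names below are made up for illustration; only the option keys and values come from the patch (gzip is the new default, so setting it explicitly is purely illustrative):

```sql
-- Illustrative only: enable Iceberg compatibility metadata for a Paimon table
-- and pin the Iceberg manifest compression introduced above.
CREATE TABLE my_paimon.test_db.orders (
    order_id BIGINT,
    dt STRING,
    amount DOUBLE
) WITH (
    'metadata.iceberg.storage' = 'hadoop-catalog',
    'metadata.iceberg.manifest-compression' = 'gzip'
);
```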
    diff --git a/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java b/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java index 769ce6b1614af..3900233d21cea 100644 --- a/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java +++ b/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java @@ -70,6 +70,13 @@ public class IcebergOptions { .noDefaultValue() .withDescription("hadoop-conf-dir for Iceberg Hive catalog."); + public static final ConfigOption MANIFEST_COMPRESSION = + key("metadata.iceberg.manifest-compression") + .stringType() + .defaultValue( + "gzip") // some Iceberg reader cannot support zstd, for example DuckDB + .withDescription("Compression for Iceberg manifest files."); + /** Where to store Iceberg metadata. */ public enum StorageType implements DescribedEnum { DISABLED("disabled", "Disable Iceberg compatibility support."), diff --git a/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFile.java b/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFile.java index d04cf3576a111..57484a1f3ff92 100644 --- a/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFile.java +++ b/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFile.java @@ -19,6 +19,7 @@ package org.apache.paimon.iceberg.manifest; import org.apache.paimon.CoreOptions; +import org.apache.paimon.annotation.VisibleForTesting; import org.apache.paimon.format.FileFormat; import org.apache.paimon.format.FormatReaderFactory; import org.apache.paimon.format.FormatWriterFactory; @@ -26,6 +27,7 @@ import org.apache.paimon.format.SimpleStatsCollector; import org.apache.paimon.fs.FileIO; import org.apache.paimon.fs.Path; +import org.apache.paimon.iceberg.IcebergOptions; import org.apache.paimon.iceberg.IcebergPathFactory; import org.apache.paimon.iceberg.manifest.IcebergManifestFileMeta.Content; import org.apache.paimon.iceberg.metadata.IcebergPartitionSpec; @@ -82,23 +84,28 @@ public IcebergManifestFile( this.targetFileSize = targetFileSize; } + @VisibleForTesting + public String compression() { + return compression; + } + public static IcebergManifestFile create(FileStoreTable table, IcebergPathFactory pathFactory) { RowType partitionType = table.schema().logicalPartitionType(); RowType entryType = IcebergManifestEntry.schema(partitionType); - Options manifestFileAvroOptions = Options.fromMap(table.options()); + Options avroOptions = Options.fromMap(table.options()); // https://github.com/apache/iceberg/blob/main/core/src/main/java/org/apache/iceberg/ManifestReader.java - manifestFileAvroOptions.set( + avroOptions.set( "avro.row-name-mapping", "org.apache.paimon.avro.generated.record:manifest_entry," + "manifest_entry_data_file:r2," + "r2_partition:r102"); - FileFormat manifestFileAvro = FileFormat.fromIdentifier("avro", manifestFileAvroOptions); + FileFormat manifestFileAvro = FileFormat.fromIdentifier("avro", avroOptions); return new IcebergManifestFile( table.fileIO(), partitionType, manifestFileAvro.createReaderFactory(entryType), manifestFileAvro.createWriterFactory(entryType), - table.coreOptions().manifestCompression(), + avroOptions.get(IcebergOptions.MANIFEST_COMPRESSION), pathFactory.manifestFileFactory(), table.coreOptions().manifestTargetSize()); } diff --git a/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestList.java b/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestList.java index 
911ebf954ce53..ab5cc926cd961 100644 --- a/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestList.java +++ b/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestList.java @@ -18,10 +18,12 @@ package org.apache.paimon.iceberg.manifest; +import org.apache.paimon.annotation.VisibleForTesting; import org.apache.paimon.format.FileFormat; import org.apache.paimon.format.FormatReaderFactory; import org.apache.paimon.format.FormatWriterFactory; import org.apache.paimon.fs.FileIO; +import org.apache.paimon.iceberg.IcebergOptions; import org.apache.paimon.iceberg.IcebergPathFactory; import org.apache.paimon.options.Options; import org.apache.paimon.table.FileStoreTable; @@ -51,19 +53,24 @@ public IcebergManifestList( null); } + @VisibleForTesting + public String compression() { + return compression; + } + public static IcebergManifestList create(FileStoreTable table, IcebergPathFactory pathFactory) { - Options manifestListAvroOptions = Options.fromMap(table.options()); + Options avroOptions = Options.fromMap(table.options()); // https://github.com/apache/iceberg/blob/main/core/src/main/java/org/apache/iceberg/ManifestLists.java - manifestListAvroOptions.set( + avroOptions.set( "avro.row-name-mapping", "org.apache.paimon.avro.generated.record:manifest_file," + "manifest_file_partitions:r508"); - FileFormat manifestListAvro = FileFormat.fromIdentifier("avro", manifestListAvroOptions); + FileFormat manifestListAvro = FileFormat.fromIdentifier("avro", avroOptions); return new IcebergManifestList( table.fileIO(), manifestListAvro.createReaderFactory(IcebergManifestFileMeta.schema()), manifestListAvro.createWriterFactory(IcebergManifestFileMeta.schema()), - table.coreOptions().manifestCompression(), + avroOptions.get(IcebergOptions.MANIFEST_COMPRESSION), pathFactory.manifestListFactory()); } } diff --git a/paimon-core/src/test/java/org/apache/paimon/iceberg/IcebergCompatibilityTest.java b/paimon-core/src/test/java/org/apache/paimon/iceberg/IcebergCompatibilityTest.java index 9a27d5618459e..45cfe109b9869 100644 --- a/paimon-core/src/test/java/org/apache/paimon/iceberg/IcebergCompatibilityTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/iceberg/IcebergCompatibilityTest.java @@ -30,6 +30,7 @@ import org.apache.paimon.disk.IOManagerImpl; import org.apache.paimon.fs.Path; import org.apache.paimon.fs.local.LocalFileIO; +import org.apache.paimon.iceberg.manifest.IcebergManifestFile; import org.apache.paimon.iceberg.manifest.IcebergManifestFileMeta; import org.apache.paimon.iceberg.manifest.IcebergManifestList; import org.apache.paimon.iceberg.metadata.IcebergMetadata; @@ -302,6 +303,11 @@ public void testIcebergSnapshotExpire() throws Exception { IcebergPathFactory pathFactory = new IcebergPathFactory(new Path(table.location(), "metadata")); IcebergManifestList manifestList = IcebergManifestList.create(table, pathFactory); + assertThat(manifestList.compression()).isEqualTo("gzip"); + + IcebergManifestFile manifestFile = IcebergManifestFile.create(table, pathFactory); + assertThat(manifestFile.compression()).isEqualTo("gzip"); + Set usingManifests = new HashSet<>(); for (IcebergManifestFileMeta fileMeta : manifestList.read(new Path(metadata.currentSnapshot().manifestList()).getName())) { From 512e2ce05c15c388f81bf2b645546c9a29071a7b Mon Sep 17 00:00:00 2001 From: Jingsong Lee Date: Mon, 2 Dec 2024 19:06:20 +0800 Subject: [PATCH 091/157] [iceberg] Introduce metadata.iceberg.manifest-legacy-version (#4621) --- .../migration/iceberg-compatibility.md | 11 
+++++++ .../apache/paimon/iceberg/IcebergOptions.java | 7 +++++ .../manifest/IcebergManifestFileMeta.java | 29 ++++++++++++++++++- .../IcebergManifestFileMetaSerializer.java | 5 ++-- .../iceberg/manifest/IcebergManifestList.java | 24 ++++++++------- .../iceberg/IcebergCompatibilityTest.java | 15 ++++++++-- 6 files changed, 75 insertions(+), 16 deletions(-) diff --git a/docs/content/migration/iceberg-compatibility.md b/docs/content/migration/iceberg-compatibility.md index 7b83936b53208..d745607148643 100644 --- a/docs/content/migration/iceberg-compatibility.md +++ b/docs/content/migration/iceberg-compatibility.md @@ -377,9 +377,20 @@ you also need to set some (or all) of the following table options when creating String Compression for Iceberg manifest files. + +
    metadata.iceberg.manifest-legacy-version
    + false + Boolean + Should use the legacy manifest version to generate Iceberg's 1.4 manifest files. + +## AWS Athena + +AWS Athena may use old manifest reader to read Iceberg manifest by names, we should let Paimon producing legacy Iceberg +manifest list file, you can enable: `'metadata.iceberg.manifest-legacy-version'`. + ## Trino Iceberg In this example, we use Trino Iceberg connector to access Paimon table through Iceberg Hive catalog. diff --git a/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java b/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java index 3900233d21cea..c0ceed97ba8cf 100644 --- a/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java +++ b/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java @@ -77,6 +77,13 @@ public class IcebergOptions { "gzip") // some Iceberg reader cannot support zstd, for example DuckDB .withDescription("Compression for Iceberg manifest files."); + public static final ConfigOption MANIFEST_LEGACY_VERSION = + key("metadata.iceberg.manifest-legacy-version") + .booleanType() + .defaultValue(false) + .withDescription( + "Should use the legacy manifest version to generate Iceberg's 1.4 manifest files."); + /** Where to store Iceberg metadata. */ public enum StorageType implements DescribedEnum { DISABLED("disabled", "Disable Iceberg compatibility support."), diff --git a/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFileMeta.java b/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFileMeta.java index fd9c2daf7e208..c5fcb6005fcb8 100644 --- a/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFileMeta.java +++ b/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFileMeta.java @@ -165,7 +165,11 @@ public List partitions() { return partitions; } - public static RowType schema() { + public static RowType schema(boolean legacyVersion) { + return legacyVersion ? 
schemaForIceberg1_4() : schemaForIcebergNew(); + } + + private static RowType schemaForIcebergNew() { List fields = new ArrayList<>(); fields.add(new DataField(500, "manifest_path", DataTypes.STRING().notNull())); fields.add(new DataField(501, "manifest_length", DataTypes.BIGINT().notNull())); @@ -186,6 +190,29 @@ public static RowType schema() { return new RowType(false, fields); } + private static RowType schemaForIceberg1_4() { + // see https://github.com/apache/iceberg/pull/5338 + // some reader still want old schema, for example, AWS athena + List fields = new ArrayList<>(); + fields.add(new DataField(500, "manifest_path", DataTypes.STRING().notNull())); + fields.add(new DataField(501, "manifest_length", DataTypes.BIGINT().notNull())); + fields.add(new DataField(502, "partition_spec_id", DataTypes.INT().notNull())); + fields.add(new DataField(517, "content", DataTypes.INT().notNull())); + fields.add(new DataField(515, "sequence_number", DataTypes.BIGINT().notNull())); + fields.add(new DataField(516, "min_sequence_number", DataTypes.BIGINT().notNull())); + fields.add(new DataField(503, "added_snapshot_id", DataTypes.BIGINT())); + fields.add(new DataField(504, "added_data_files_count", DataTypes.INT().notNull())); + fields.add(new DataField(505, "existing_data_files_count", DataTypes.INT().notNull())); + fields.add(new DataField(506, "deleted_data_files_count", DataTypes.INT().notNull())); + fields.add(new DataField(512, "added_rows_count", DataTypes.BIGINT().notNull())); + fields.add(new DataField(513, "existing_rows_count", DataTypes.BIGINT().notNull())); + fields.add(new DataField(514, "deleted_rows_count", DataTypes.BIGINT().notNull())); + fields.add( + new DataField( + 508, "partitions", DataTypes.ARRAY(IcebergPartitionSummary.schema()))); + return new RowType(false, fields); + } + @Override public boolean equals(Object o) { if (this == o) { diff --git a/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFileMetaSerializer.java b/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFileMetaSerializer.java index c40a26e8fdf8f..2b4c9b771c599 100644 --- a/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFileMetaSerializer.java +++ b/paimon-core/src/main/java/org/apache/paimon/iceberg/manifest/IcebergManifestFileMetaSerializer.java @@ -24,6 +24,7 @@ import org.apache.paimon.data.InternalArray; import org.apache.paimon.data.InternalRow; import org.apache.paimon.iceberg.manifest.IcebergManifestFileMeta.Content; +import org.apache.paimon.types.RowType; import org.apache.paimon.utils.ObjectSerializer; import java.util.ArrayList; @@ -36,8 +37,8 @@ public class IcebergManifestFileMetaSerializer extends ObjectSerializer { public IcebergManifestList( FileIO fileIO, - FormatReaderFactory readerFactory, - FormatWriterFactory writerFactory, + FileFormat fileFormat, + RowType manifestType, String compression, PathFactory pathFactory) { super( fileIO, - new IcebergManifestFileMetaSerializer(), - IcebergManifestFileMeta.schema(), - readerFactory, - writerFactory, + new IcebergManifestFileMetaSerializer(manifestType), + manifestType, + fileFormat.createReaderFactory(manifestType), + fileFormat.createWriterFactory(manifestType), compression, pathFactory, null); @@ -65,11 +64,14 @@ public static IcebergManifestList create(FileStoreTable table, IcebergPathFactor "avro.row-name-mapping", "org.apache.paimon.avro.generated.record:manifest_file," + "manifest_file_partitions:r508"); - FileFormat manifestListAvro = 
FileFormat.fromIdentifier("avro", avroOptions); + FileFormat fileFormat = FileFormat.fromIdentifier("avro", avroOptions); + RowType manifestType = + IcebergManifestFileMeta.schema( + avroOptions.get(IcebergOptions.MANIFEST_LEGACY_VERSION)); return new IcebergManifestList( table.fileIO(), - manifestListAvro.createReaderFactory(IcebergManifestFileMeta.schema()), - manifestListAvro.createWriterFactory(IcebergManifestFileMeta.schema()), + fileFormat, + manifestType, avroOptions.get(IcebergOptions.MANIFEST_COMPRESSION), pathFactory.manifestListFactory()); } diff --git a/paimon-core/src/test/java/org/apache/paimon/iceberg/IcebergCompatibilityTest.java b/paimon-core/src/test/java/org/apache/paimon/iceberg/IcebergCompatibilityTest.java index 45cfe109b9869..b069ac031d38b 100644 --- a/paimon-core/src/test/java/org/apache/paimon/iceberg/IcebergCompatibilityTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/iceberg/IcebergCompatibilityTest.java @@ -78,6 +78,7 @@ import java.util.stream.Collectors; import static org.assertj.core.api.Assertions.assertThat; +import static org.assertj.core.api.Assertions.assertThatThrownBy; /** Tests for Iceberg compatibility. */ public class IcebergCompatibilityTest { @@ -309,11 +310,21 @@ public void testIcebergSnapshotExpire() throws Exception { assertThat(manifestFile.compression()).isEqualTo("gzip"); Set usingManifests = new HashSet<>(); - for (IcebergManifestFileMeta fileMeta : - manifestList.read(new Path(metadata.currentSnapshot().manifestList()).getName())) { + String manifestListFile = new Path(metadata.currentSnapshot().manifestList()).getName(); + for (IcebergManifestFileMeta fileMeta : manifestList.read(manifestListFile)) { usingManifests.add(fileMeta.manifestPath()); } + IcebergManifestList legacyManifestList = + IcebergManifestList.create( + table.copy( + Collections.singletonMap( + IcebergOptions.MANIFEST_LEGACY_VERSION.key(), "true")), + pathFactory); + assertThatThrownBy(() -> legacyManifestList.read(manifestListFile)) + .rootCause() + .isInstanceOf(NullPointerException.class); + Set unusedFiles = new HashSet<>(); for (int i = 0; i < 2; i++) { unusedFiles.add(metadata.snapshots().get(i).manifestList()); From a5cb687755bcb02780e291f9d58538eb9a9d23e0 Mon Sep 17 00:00:00 2001 From: yuzelin <33053040+yuzelin@users.noreply.github.com> Date: Mon, 2 Dec 2024 19:12:55 +0800 Subject: [PATCH 092/157] [doc] Update Python API for pypaimon 0.2 (#4623) --- docs/content/program-api/python-api.md | 256 +++++++++++++++++-------- 1 file changed, 179 insertions(+), 77 deletions(-) diff --git a/docs/content/program-api/python-api.md b/docs/content/program-api/python-api.md index ff457cc55f446..86acee06d3a86 100644 --- a/docs/content/program-api/python-api.md +++ b/docs/content/program-api/python-api.md @@ -34,9 +34,9 @@ Java-based implementation will launch a JVM and use `py4j` to execute Java code ### SDK Installing -SDK is published at [paimon-python](https://pypi.org/project/paimon-python/). You can install by +SDK is published at [pypaimon](https://pypi.org/project/pypaimon/). 
You can install by ```shell -pip install paimon-python +pip install pypaimon ``` ### Java Runtime Environment @@ -67,7 +67,7 @@ classpath via one of the following ways: ```python import os -from paimon_python_java import constants +from pypaimon.py4j import constants os.environ[constants.PYPAIMON_JAVA_CLASSPATH] = '/path/to/jars/*' ``` @@ -81,7 +81,7 @@ You can set JVM args via one of the following ways: ```python import os -from paimon_python_java import constants +from pypaimon.py4j import constants os.environ[constants.PYPAIMON_JVM_ARGS] = 'arg1 arg2 ...' ``` @@ -98,7 +98,7 @@ Otherwise, you should set hadoop classpath via one of the following ways: ```python import os -from paimon_python_java import constants +from pypaimon.py4j import constants os.environ[constants.PYPAIMON_HADOOP_CLASSPATH] = '/path/to/jars/*' ``` @@ -111,7 +111,7 @@ If you just want to test codes in local, we recommend to use [Flink Pre-bundled Before coming into contact with the Table, you need to create a Catalog. ```python -from paimon_python_java import Catalog +from pypaimon.py4j import Catalog # Note that keys and values are all string catalog_options = { @@ -138,12 +138,17 @@ catalog.create_database( ### Create Schema -Table schema contains fields definition, partition keys, primary keys, table options and comment. For example: +Table schema contains fields definition, partition keys, primary keys, table options and comment. +The field definition is described by `pyarrow.Schema`. All arguments except fields definition are optional. + +Generally, there are two ways to build `pyarrow.Schema`. + +First, you can use `pyarrow.schema` method directly, for example: ```python import pyarrow as pa -from paimon_python_api import Schema +from pypaimon import Schema pa_schema = pa.schema([ ('dt', pa.string()), @@ -161,13 +166,13 @@ schema = Schema( ) ``` -All arguments except `pa_schema` is optional. If you have some Pandas data, the `pa_schema` can be extracted from `DataFrame`: +Second, if you have some Pandas data, the `pa_schema` can be extracted from `DataFrame`: ```python import pandas as pd import pyarrow as pa -from paimon_python_api import Schema +from pypaimon import Schema # Example DataFrame data data = { @@ -184,10 +189,15 @@ schema = Schema( pa_schema=record_batch.schema, partition_keys=['dt', 'hh'], primary_keys=['dt', 'hh', 'pk'], - options={'bucket': '2'}) + options={'bucket': '2'}, + comment='my test table' +) ``` ### Create Table + +After building table schema, you can create corresponding table: + ```python schema = ... catalog.create_table( @@ -207,30 +217,165 @@ table = catalog.get_table('database_name.table_name') ## Batch Read -TableRead interface provides parallelly reading for multiple splits. You can set `'max-workers': 'N'` in `catalog_options` -to set thread numbers when reading splits. `max-workers` is 1 by default, that means TableRead will read splits sequentially -if you doesn't set `max-workers`. +The reading is divided into Scan Plan and Read Splits stages. A `ReadBuilder` is used to create utils for these stages. ```python table = catalog.get_table('database_name.table_name') - -# 1. 
Create table scan and read read_builder = table.new_read_builder() +``` + +You can use `PredicateBuilder` to build filters and pushdown them by `ReadBuilder`: + +```python +# Example filter: ('f0' < 3 OR 'f1' > 6) AND 'f3' = 'A' + +predicate_builder = read_builder.new_predicate_builder() + +predicate1 = predicate_builder.less_than('f0', 3) +predicate2 = predicate_builder.greater_than('f1', 6) +predicate3 = predicate_builder.or_predicates([predicate1, predicate2]) + +predicate4 = predicate_builder.equal('f3', 'A') +predicate_5 = predicate_builder.and_predicates([predicate3, predicate4]) + +read_builder = read_builder.with_filter(predicate_5) +``` + + +| Predicate kind | Predicate method | +|:----------------------|:----------------------------------------------| +| p1 and p2 | PredicateBuilder.and_predicates([p1, p2]) | +| p1 or p2 | PredicateBuilder.or_predicates([p1, p2]) | +| f = literal | PredicateBuilder.equal(f, literal) | +| f != literal | PredicateBuilder.not_equal(f, literal) | +| f < literal | PredicateBuilder.less_than(f, literal) | +| f <= literal | PredicateBuilder.less_or_equal(f, literal) | +| f > literal | PredicateBuilder.greater_than(f, literal) | +| f >= literal | PredicateBuilder.greater_or_equal(f, literal) | +| f is null | PredicateBuilder.is_null(f) | +| f is not null | PredicateBuilder.is_not_null(f) | +| f.startswith(literal) | PredicateBuilder.startswith(f, literal) | +| f.endswith(literal) | PredicateBuilder.endswith(f, literal) | +| f.contains(literal) | PredicateBuilder.contains(f, literal) | +| f is in [l1, l2] | PredicateBuilder.is_in(f, [l1, l2]) | +| f is not in [l1, l2] | PredicateBuilder.is_not_in(f, [l1, l2]) | +| lower <= f <= upper | PredicateBuilder.between(f, lower, upper) | + +You can also pushdown projection by `ReadBuilder`: + +```python +# select f3 and f2 columns +read_builder = read_builder.with_projection(['f3', 'f2']) +``` + +Then you can scan plan: + +```python table_scan = read_builder.new_scan() -table_read = read_builder.new_read() +splits = table_scan.splits() +``` + +Finally, you can read data from the `splits` to various data format. -# 2. Get splits -splits = table_scan.plan().splits() +### Apache Arrow -# 3. Read splits. Support 3 methods: -# 3.1 Read as pandas.DataFrame -dataframe = table_read.to_pandas(splits) +This requires `pyarrow` to be installed. -# 3.2 Read as pyarrow.Table +You can read all the data into a `pyarrow.Table`: + +```python +table_read = read_builder.new_read() pa_table = table_read.to_arrow(splits) +print(pa_table) + +# pyarrow.Table +# f0: int32 +# f1: string +# ---- +# f0: [[1,2,3],[4,5,6],...] +# f1: [["a","b","c"],["d","e","f"],...] +``` + +You can also read data into a `pyarrow.RecordBatchReader` and iterate record batches: -# 3.3 Read as pyarrow.RecordBatchReader -record_batch_reader = table_read.to_arrow_batch_reader(splits) +```python +table_read = read_builder.new_read() +for batch in table_read.to_arrow_batch_reader(splits) + print(batch) + +# pyarrow.RecordBatch +# f0: int32 +# f1: string +# ---- +# f0: [1,2,3] +# f1: ["a","b","c"] +``` + +### Pandas + +This requires `pandas` to be installed. + +You can read all the data into a `pandas.DataFrame`: + +```python +table_read = read_builder.new_read() +df = table_read.to_pandas(splits) +print(df) + +# f0 f1 +# 0 1 a +# 1 2 b +# 2 3 c +# 3 4 d +# ... +``` + +### DuckDB + +This requires `duckdb` to be installed. 
+ +You can convert the splits into a in-memory DuckDB table and query it: + +```python +table_read = read_builder.new_read() +duckdb_con = table_read.to_duckdb(splits, 'duckdb_table') + +print(duckdb_con.query("SELECT * FROM duckdb_table").fetchdf()) +# f0 f1 +# 0 1 a +# 1 2 b +# 2 3 c +# 3 4 d +# ... + +print(duckdb_con.query("SELECT * FROM duckdb_table WHERE f0 = 1").fetchdf()) +# f0 f1 +# 0 1 a +``` + +### Ray + +This requires `ray` to be installed. + +You can convert the splits into a Ray dataset and handle it by Ray API: + +```python +table_read = read_builder.new_read() +ray_dataset = table_read.to_ray(splits) + +print(ray_dataset) +# MaterializedDataset(num_blocks=1, num_rows=9, schema={f0: int32, f1: string}) + +print(ray_dataset.take(3)) +# [{'f0': 1, 'f1': 'a'}, {'f0': 2, 'f1': 'b'}, {'f0': 3, 'f1': 'c'}] + +print(ray_dataset.to_pandas()) +# f0 f1 +# 0 1 a +# 1 2 b +# 2 3 c +# 3 4 d +# ... ``` ## Batch Write @@ -246,12 +391,6 @@ table = catalog.get_table('database_name.table_name') # 1. Create table write and commit write_builder = table.new_batch_write_builder() -# By default, write data will be appended to table. -# If you want to overwrite table: -# write_builder.overwrite() -# If you want to overwrite partition 'dt=2024-01-01': -# write_builder.overwrite({'dt': '2024-01-01'}) - table_write = write_builder.new_write() table_commit = write_builder.new_commit() @@ -275,7 +414,16 @@ table_commit.commit(commit_messages) # 4. Close resources table_write.close() table_commit.close() +``` + +By default, the data will be appended to table. If you want to overwrite table, you should use `TableWrite#overwrite` API: + +```python +# overwrite whole table +write_builder.overwrite() +# overwrite partition 'dt=2024-01-01' +write_builder.overwrite({'dt': '2024-01-01'}) ``` ## Data Types @@ -290,49 +438,3 @@ table_commit.close() | pyarrow.float64() | DOUBLE | | pyarrow.string() | STRING | | pyarrow.boolean() | BOOLEAN | - -## Predicate - -You can use predicate to filter data when reading. 
Example: - -```python -# table data: -# f0: 0 1 2 3 4 -# f1: 5 6 7 8 9 -read_builder = table.new_read_builder() -predicate_builder = read_builder.new_predicate_builder() - -# build predicate: f0 < 3 && f1 > 5 -predicate1 = predicate_builder.less_than('f0', 1); -predicate2 = predicate_builder.greater_than('f1', 5); -predicate = predicate_builder.and_predicates([predicate1, predicate2]) - -read_builder = read_builder.with_filter(predicate) -table_scan = read_builder.new_scan() -table_read = read_builder.new_read() -splits = table_scan.plan().splits() -dataframe = table_read.to_pandas(splits) - -# result: -# f0: 1 2 -# f1: 6 7 -``` - -| Predicate kind | Predicate method | -|:----------------------|:----------------------------------------------| -| p1 and p2 | PredicateBuilder.and_predicates([p1, p2]) | -| p1 or p2 | PredicateBuilder.or_predicates([p1, p2]) | -| f = literal | PredicateBuilder.equal(f, literal) | -| f != literal | PredicateBuilder.not_equal(f, literal) | -| f < literal | PredicateBuilder.less_than(f, literal) | -| f <= literal | PredicateBuilder.less_or_equal(f, literal) | -| f > literal | PredicateBuilder.greater_than(f, literal) | -| f >= literal | PredicateBuilder.greater_or_equal(f, literal) | -| f is null | PredicateBuilder.is_null(f) | -| f is not null | PredicateBuilder.is_not_null(f) | -| f.startswith(literal) | PredicateBuilder.startswith(f, literal) | -| f.endswith(literal) | PredicateBuilder.endswith(f, literal) | -| f.contains(literal) | PredicateBuilder.contains(f, literal) | -| f is in [l1, l2] | PredicateBuilder.is_in(f, [l1, l2]) | -| f is not in [l1, l2] | PredicateBuilder.is_not_in(f, [l1, l2]) | -| lower <= f <= upper | PredicateBuilder.between(f, lower, upper) | From 419b02a836da34e2050a1d6c56a57e3ea32d7e99 Mon Sep 17 00:00:00 2001 From: Jingsong Lee Date: Mon, 2 Dec 2024 21:09:48 +0800 Subject: [PATCH 093/157] [iceberg] Introduce integration for AWS Glue (#4624) --- .../migration/iceberg-compatibility.md | 11 ++++++ .../AbstractIcebergCommitCallback.java | 35 +++++++++--------- .../apache/paimon/iceberg/IcebergOptions.java | 6 ++++ .../iceberg/IcebergHiveMetadataCommitter.java | 8 ++--- .../IcebergHive23MetadataCommitterITCase.java | 9 ++++- .../IcebergHive31MetadataCommitterITCase.java | 9 ++++- ...cebergHiveMetadataCommitterITCaseBase.java | 36 +++++++++++++++++++ 7 files changed, 92 insertions(+), 22 deletions(-) diff --git a/docs/content/migration/iceberg-compatibility.md b/docs/content/migration/iceberg-compatibility.md index d745607148643..01a03a45264dd 100644 --- a/docs/content/migration/iceberg-compatibility.md +++ b/docs/content/migration/iceberg-compatibility.md @@ -383,9 +383,20 @@ you also need to set some (or all) of the following table options when creating Boolean Should use the legacy manifest version to generate Iceberg's 1.4 manifest files. + +
    metadata.iceberg.hive-client-class
    + org.apache.hadoop.hive.metastore.HiveMetaStoreClient + String + Hive client class name for Iceberg Hive Catalog. + +## AWS Glue Catalog + +You can use Hive Catalog to connect AWS Glue metastore, you can use set `'metadata.iceberg.hive-client-class'` to +`'com.amazonaws.glue.catalog.metastore.AWSCatalogMetastoreClient'`. + ## AWS Athena AWS Athena may use old manifest reader to read Iceberg manifest by names, we should let Paimon producing legacy Iceberg diff --git a/paimon-core/src/main/java/org/apache/paimon/iceberg/AbstractIcebergCommitCallback.java b/paimon-core/src/main/java/org/apache/paimon/iceberg/AbstractIcebergCommitCallback.java index 1b952c1716cf9..7ea6cbe05777e 100644 --- a/paimon-core/src/main/java/org/apache/paimon/iceberg/AbstractIcebergCommitCallback.java +++ b/paimon-core/src/main/java/org/apache/paimon/iceberg/AbstractIcebergCommitCallback.java @@ -112,22 +112,7 @@ public AbstractIcebergCommitCallback(FileStoreTable table, String commitUser) { break; case HADOOP_CATALOG: case HIVE_CATALOG: - Path dbPath = table.location().getParent(); - final String dbSuffix = ".db"; - if (dbPath.getName().endsWith(dbSuffix)) { - String dbName = - dbPath.getName() - .substring(0, dbPath.getName().length() - dbSuffix.length()); - String tableName = table.location().getName(); - Path separatePath = - new Path( - dbPath.getParent(), - String.format("iceberg/%s/%s/metadata", dbName, tableName)); - this.pathFactory = new IcebergPathFactory(separatePath); - } else { - throw new UnsupportedOperationException( - "Storage type ICEBERG_WAREHOUSE can only be used on Paimon tables in a Paimon warehouse."); - } + this.pathFactory = new IcebergPathFactory(catalogTableMetadataPath(table)); break; default: throw new UnsupportedOperationException( @@ -152,6 +137,24 @@ public AbstractIcebergCommitCallback(FileStoreTable table, String commitUser) { this.manifestList = IcebergManifestList.create(table, pathFactory); } + public static Path catalogTableMetadataPath(FileStoreTable table) { + Path icebergDBPath = catalogDatabasePath(table); + return new Path(icebergDBPath, String.format("%s/metadata", table.location().getName())); + } + + public static Path catalogDatabasePath(FileStoreTable table) { + Path dbPath = table.location().getParent(); + final String dbSuffix = ".db"; + if (dbPath.getName().endsWith(dbSuffix)) { + String dbName = + dbPath.getName().substring(0, dbPath.getName().length() - dbSuffix.length()); + return new Path(dbPath.getParent(), String.format("iceberg/%s/", dbName)); + } else { + throw new UnsupportedOperationException( + "Storage type ICEBERG_WAREHOUSE can only be used on Paimon tables in a Paimon warehouse."); + } + } + @Override public void close() throws Exception {} diff --git a/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java b/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java index c0ceed97ba8cf..4b59e29c8c333 100644 --- a/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java +++ b/paimon-core/src/main/java/org/apache/paimon/iceberg/IcebergOptions.java @@ -84,6 +84,12 @@ public class IcebergOptions { .withDescription( "Should use the legacy manifest version to generate Iceberg's 1.4 manifest files."); + public static final ConfigOption HIVE_CLIENT_CLASS = + key("metadata.iceberg.hive-client-class") + .stringType() + .defaultValue("org.apache.hadoop.hive.metastore.HiveMetaStoreClient") + .withDescription("Hive client class name for Iceberg Hive Catalog."); + /** Where to store Iceberg metadata. 
*/ public enum StorageType implements DescribedEnum { DISABLED("disabled", "Disable Iceberg compatibility support."), diff --git a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/iceberg/IcebergHiveMetadataCommitter.java b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/iceberg/IcebergHiveMetadataCommitter.java index d913f729e3518..ddd21384cbc83 100644 --- a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/iceberg/IcebergHiveMetadataCommitter.java +++ b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/iceberg/IcebergHiveMetadataCommitter.java @@ -22,7 +22,6 @@ import org.apache.paimon.client.ClientPool; import org.apache.paimon.fs.Path; import org.apache.paimon.hive.HiveCatalog; -import org.apache.paimon.hive.HiveCatalogFactory; import org.apache.paimon.hive.HiveTypeUtils; import org.apache.paimon.hive.pool.CachedClientPool; import org.apache.paimon.options.Options; @@ -49,6 +48,8 @@ import java.util.HashMap; import java.util.stream.Collectors; +import static org.apache.paimon.iceberg.AbstractIcebergCommitCallback.catalogDatabasePath; + /** * {@link IcebergMetadataCommitter} to commit Iceberg metadata to Hive metastore, so the table can * be visited by Iceberg's Hive catalog. @@ -98,9 +99,7 @@ public IcebergHiveMetadataCommitter(FileStoreTable table) { this.clients = new CachedClientPool( - hiveConf, - options, - HiveCatalogFactory.METASTORE_CLIENT_CLASS.defaultValue()); + hiveConf, options, options.getString(IcebergOptions.HIVE_CLIENT_CLASS)); } @Override @@ -158,6 +157,7 @@ private boolean databaseExists(String databaseName) throws Exception { private void createDatabase(String databaseName) throws Exception { Database database = new Database(); database.setName(databaseName); + database.setLocationUri(catalogDatabasePath(table).toString()); clients.execute(client -> client.createDatabase(database)); } diff --git a/paimon-hive/paimon-hive-connector-2.3/src/test/java/org/apache/paimon/iceberg/IcebergHive23MetadataCommitterITCase.java b/paimon-hive/paimon-hive-connector-2.3/src/test/java/org/apache/paimon/iceberg/IcebergHive23MetadataCommitterITCase.java index a9e4ba945440e..7d726e75a17d2 100644 --- a/paimon-hive/paimon-hive-connector-2.3/src/test/java/org/apache/paimon/iceberg/IcebergHive23MetadataCommitterITCase.java +++ b/paimon-hive/paimon-hive-connector-2.3/src/test/java/org/apache/paimon/iceberg/IcebergHive23MetadataCommitterITCase.java @@ -18,5 +18,12 @@ package org.apache.paimon.iceberg; +import org.apache.paimon.hive.CreateFailHiveMetaStoreClient; + /** IT cases for {@link IcebergHiveMetadataCommitter} in Hive 2.3. 
*/ -public class IcebergHive23MetadataCommitterITCase extends IcebergHiveMetadataCommitterITCaseBase {} +public class IcebergHive23MetadataCommitterITCase extends IcebergHiveMetadataCommitterITCaseBase { + @Override + protected String createFailHiveMetaStoreClient() { + return CreateFailHiveMetaStoreClient.class.getName(); + } +} diff --git a/paimon-hive/paimon-hive-connector-3.1/src/test/java/org/apache/paimon/iceberg/IcebergHive31MetadataCommitterITCase.java b/paimon-hive/paimon-hive-connector-3.1/src/test/java/org/apache/paimon/iceberg/IcebergHive31MetadataCommitterITCase.java index 6f4b0afd1ae12..0634adfad3576 100644 --- a/paimon-hive/paimon-hive-connector-3.1/src/test/java/org/apache/paimon/iceberg/IcebergHive31MetadataCommitterITCase.java +++ b/paimon-hive/paimon-hive-connector-3.1/src/test/java/org/apache/paimon/iceberg/IcebergHive31MetadataCommitterITCase.java @@ -18,5 +18,12 @@ package org.apache.paimon.iceberg; +import org.apache.paimon.hive.CreateFailHiveMetaStoreClient; + /** IT cases for {@link IcebergHiveMetadataCommitter} in Hive 3.1. */ -public class IcebergHive31MetadataCommitterITCase extends IcebergHiveMetadataCommitterITCaseBase {} +public class IcebergHive31MetadataCommitterITCase extends IcebergHiveMetadataCommitterITCaseBase { + @Override + protected String createFailHiveMetaStoreClient() { + return CreateFailHiveMetaStoreClient.class.getName(); + } +} diff --git a/paimon-hive/paimon-hive-connector-common/src/test/java/org/apache/paimon/iceberg/IcebergHiveMetadataCommitterITCaseBase.java b/paimon-hive/paimon-hive-connector-common/src/test/java/org/apache/paimon/iceberg/IcebergHiveMetadataCommitterITCaseBase.java index fab22775751b0..d0c64c5d3b7fc 100644 --- a/paimon-hive/paimon-hive-connector-common/src/test/java/org/apache/paimon/iceberg/IcebergHiveMetadataCommitterITCaseBase.java +++ b/paimon-hive/paimon-hive-connector-common/src/test/java/org/apache/paimon/iceberg/IcebergHiveMetadataCommitterITCaseBase.java @@ -104,6 +104,12 @@ public void testPrimaryKeyTable() throws Exception { Row.of(2, 1, "cat"), Row.of(2, 2, "elephant")), collect(tEnv.executeSql("SELECT * FROM my_iceberg.test_db.t ORDER BY pt, id"))); + + Assert.assertTrue( + hiveShell + .executeQuery("DESC DATABASE EXTENDED test_db") + .toString() + .contains("iceberg/test_db")); } @Test @@ -150,6 +156,36 @@ public void testAppendOnlyTable() throws Exception { "SELECT data, id, pt FROM my_iceberg.test_db.t WHERE id > 1 ORDER BY pt, id"))); } + @Test + public void testCustomMetastoreClass() { + TableEnvironment tEnv = + TableEnvironmentImpl.create( + EnvironmentSettings.newInstance().inBatchMode().build()); + tEnv.executeSql( + "CREATE CATALOG my_paimon WITH ( 'type' = 'paimon', 'warehouse' = '" + + path + + "' )"); + tEnv.executeSql("CREATE DATABASE my_paimon.test_db"); + tEnv.executeSql( + String.format( + "CREATE TABLE my_paimon.test_db.t ( pt INT, id INT, data STRING ) PARTITIONED BY (pt) WITH " + + "( " + + "'metadata.iceberg.storage' = 'hive-catalog', " + + "'metadata.iceberg.uri' = '', " + + "'file.format' = 'avro', " + + "'metadata.iceberg.hive-client-class' = '%s')", + createFailHiveMetaStoreClient())); + Assert.assertThrows( + Exception.class, + () -> + tEnv.executeSql( + "INSERT INTO my_paimon.test_db.t VALUES " + + "(1, 1, 'apple'), (1, 2, 'pear'), (2, 1, 'cat'), (2, 2, 'dog')") + .await()); + } + + protected abstract String createFailHiveMetaStoreClient(); + private List collect(TableResult result) throws Exception { List rows = new ArrayList<>(); try (CloseableIterator it = result.collect()) { 
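Stepping back from the test code above: the "AWS Glue Catalog" docs section and `testCustomMetastoreClass` in this commit configure the custom Hive client purely through table options. A minimal Flink SQL sketch of that Glue setup, assuming the catalog, database and table names from the test (all placeholders) and the Glue client class available on the classpath:

```sql
-- Illustrative only: mirrors the options used in testCustomMetastoreClass,
-- swapping in the AWS Glue metastore client described in the docs above.
CREATE TABLE my_paimon.test_db.t (
    pt INT,
    id INT,
    data STRING
) PARTITIONED BY (pt) WITH (
    'metadata.iceberg.storage' = 'hive-catalog',
    'metadata.iceberg.hive-client-class' = 'com.amazonaws.glue.catalog.metastore.AWSCatalogMetastoreClient'
);
```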
From 6fb887f47f2e79f6b3142f094b20b6d7a3f86846 Mon Sep 17 00:00:00 2001 From: yunfengzhou-hub Date: Mon, 2 Dec 2024 21:11:23 +0800 Subject: [PATCH 094/157] [flink] Avoid deprecated usage on TableSchema, DataType and DescriptorProperties (#4611) --- .../apache/paimon/flink/DataCatalogTable.java | 115 +++++++++++----- .../org/apache/paimon/flink/FlinkCatalog.java | 55 ++++---- .../paimon/flink/FlinkGenericCatalog.java | 6 - .../paimon/flink/SystemCatalogTable.java | 12 +- .../utils/FlinkCatalogPropertiesUtil.java | 102 ++++---------- .../utils/FlinkDescriptorProperties.java | 99 +++++++++++++ .../flink/FlinkCatalogPropertiesUtilTest.java | 130 +++++++++++++----- .../apache/paimon/flink/FlinkCatalogTest.java | 9 +- 8 files changed, 342 insertions(+), 186 deletions(-) create mode 100644 paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/FlinkDescriptorProperties.java diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/DataCatalogTable.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/DataCatalogTable.java index 019d7bd6892fe..e141581b476ba 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/DataCatalogTable.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/DataCatalogTable.java @@ -23,33 +23,55 @@ import org.apache.paimon.types.DataField; import org.apache.flink.table.api.Schema; -import org.apache.flink.table.api.TableColumn; -import org.apache.flink.table.api.TableSchema; -import org.apache.flink.table.api.constraints.UniqueConstraint; import org.apache.flink.table.catalog.CatalogBaseTable; import org.apache.flink.table.catalog.CatalogTable; -import org.apache.flink.table.catalog.CatalogTableImpl; import java.util.ArrayList; import java.util.HashMap; import java.util.List; import java.util.Map; +import java.util.Optional; import java.util.stream.Collectors; -/** A {@link CatalogTableImpl} to wrap {@link FileStoreTable}. */ -public class DataCatalogTable extends CatalogTableImpl { +import static org.apache.flink.util.Preconditions.checkArgument; +import static org.apache.flink.util.Preconditions.checkNotNull; + +/** A {@link CatalogTable} to wrap {@link FileStoreTable}. */ +public class DataCatalogTable implements CatalogTable { + // Schema of the table (column names and types) + private final Schema schema; + + // Partition keys if this is a partitioned table. 
It's an empty set if the table is not + // partitioned + private final List partitionKeys; + + // Properties of the table + private final Map options; + + // Comment of the table + private final String comment; private final Table table; private final Map nonPhysicalColumnComments; public DataCatalogTable( Table table, - TableSchema tableSchema, + Schema resolvedSchema, List partitionKeys, - Map properties, + Map options, String comment, Map nonPhysicalColumnComments) { - super(tableSchema, partitionKeys, properties, comment); + this.schema = resolvedSchema; + this.partitionKeys = checkNotNull(partitionKeys, "partitionKeys cannot be null"); + this.options = checkNotNull(options, "options cannot be null"); + + checkArgument( + options.entrySet().stream() + .allMatch(e -> e.getKey() != null && e.getValue() != null), + "properties cannot have null keys or values"); + + this.comment = comment; + this.table = table; this.nonPhysicalColumnComments = nonPhysicalColumnComments; } @@ -66,32 +88,30 @@ public Schema getUnresolvedSchema() { .filter(dataField -> dataField.description() != null) .collect(Collectors.toMap(DataField::name, DataField::description)); - return toSchema(getSchema(), columnComments); + return toSchema(schema, columnComments); } - /** Copied from {@link TableSchema#toSchema(Map)} to support versions lower than 1.17. */ - private Schema toSchema(TableSchema tableSchema, Map comments) { + private Schema toSchema(Schema tableSchema, Map comments) { final Schema.Builder builder = Schema.newBuilder(); - tableSchema - .getTableColumns() + .getColumns() .forEach( column -> { - if (column instanceof TableColumn.PhysicalColumn) { - final TableColumn.PhysicalColumn c = - (TableColumn.PhysicalColumn) column; - builder.column(c.getName(), c.getType()); - } else if (column instanceof TableColumn.MetadataColumn) { - final TableColumn.MetadataColumn c = - (TableColumn.MetadataColumn) column; + if (column instanceof Schema.UnresolvedPhysicalColumn) { + final Schema.UnresolvedPhysicalColumn c = + (Schema.UnresolvedPhysicalColumn) column; + builder.column(c.getName(), c.getDataType()); + } else if (column instanceof Schema.UnresolvedMetadataColumn) { + final Schema.UnresolvedMetadataColumn c = + (Schema.UnresolvedMetadataColumn) column; builder.columnByMetadata( c.getName(), - c.getType(), - c.getMetadataAlias().orElse(null), + c.getDataType(), + c.getMetadataKey(), c.isVirtual()); - } else if (column instanceof TableColumn.ComputedColumn) { - final TableColumn.ComputedColumn c = - (TableColumn.ComputedColumn) column; + } else if (column instanceof Schema.UnresolvedComputedColumn) { + final Schema.UnresolvedComputedColumn c = + (Schema.UnresolvedComputedColumn) column; builder.columnByExpression(c.getName(), c.getExpression()); } else { throw new IllegalArgumentException( @@ -104,19 +124,16 @@ private Schema toSchema(TableSchema tableSchema, Map comments) { builder.withComment(nonPhysicalColumnComments.get(colName)); } }); - tableSchema .getWatermarkSpecs() .forEach( spec -> builder.watermark( - spec.getRowtimeAttribute(), spec.getWatermarkExpr())); - + spec.getColumnName(), spec.getWatermarkExpression())); if (tableSchema.getPrimaryKey().isPresent()) { - UniqueConstraint primaryKey = tableSchema.getPrimaryKey().get(); - builder.primaryKeyNamed(primaryKey.getName(), primaryKey.getColumns()); + Schema.UnresolvedPrimaryKey primaryKey = tableSchema.getPrimaryKey().get(); + builder.primaryKeyNamed(primaryKey.getConstraintName(), primaryKey.getColumnNames()); } - return builder.build(); } @@ -124,7 
+141,7 @@ private Schema toSchema(TableSchema tableSchema, Map comments) { public CatalogBaseTable copy() { return new DataCatalogTable( table, - getSchema().copy(), + schema, new ArrayList<>(getPartitionKeys()), new HashMap<>(getOptions()), getComment(), @@ -135,10 +152,40 @@ public CatalogBaseTable copy() { public CatalogTable copy(Map options) { return new DataCatalogTable( table, - getSchema(), + schema, getPartitionKeys(), options, getComment(), nonPhysicalColumnComments); } + + @Override + public Optional getDescription() { + return Optional.of(getComment()); + } + + @Override + public Optional getDetailedDescription() { + return Optional.of("This is a catalog table in an im-memory catalog"); + } + + @Override + public boolean isPartitioned() { + return !partitionKeys.isEmpty(); + } + + @Override + public List getPartitionKeys() { + return partitionKeys; + } + + @Override + public Map getOptions() { + return options; + } + + @Override + public String getComment() { + return comment != null ? comment : ""; + } } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java index c67e79c1c06b7..3a7f9790ccca1 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkCatalog.java @@ -24,6 +24,7 @@ import org.apache.paimon.catalog.Identifier; import org.apache.paimon.flink.procedure.ProcedureUtil; import org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil; +import org.apache.paimon.flink.utils.FlinkDescriptorProperties; import org.apache.paimon.fs.Path; import org.apache.paimon.manifest.PartitionEntry; import org.apache.paimon.operation.FileStoreCommit; @@ -46,7 +47,6 @@ import org.apache.paimon.view.View; import org.apache.paimon.view.ViewImpl; -import org.apache.flink.table.api.TableSchema; import org.apache.flink.table.catalog.AbstractCatalog; import org.apache.flink.table.catalog.CatalogBaseTable; import org.apache.flink.table.catalog.CatalogDatabase; @@ -96,7 +96,6 @@ import org.apache.flink.table.catalog.exceptions.TableNotPartitionedException; import org.apache.flink.table.catalog.stats.CatalogColumnStatistics; import org.apache.flink.table.catalog.stats.CatalogTableStatistics; -import org.apache.flink.table.descriptors.DescriptorProperties; import org.apache.flink.table.expressions.Expression; import org.apache.flink.table.factories.Factory; import org.apache.flink.table.procedures.Procedure; @@ -121,13 +120,6 @@ import java.util.function.Function; import java.util.stream.Collectors; -import static org.apache.flink.table.descriptors.DescriptorProperties.COMMENT; -import static org.apache.flink.table.descriptors.DescriptorProperties.NAME; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK_ROWTIME; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK_STRATEGY_DATA_TYPE; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK_STRATEGY_EXPR; -import static org.apache.flink.table.descriptors.Schema.SCHEMA; import static org.apache.flink.table.factories.FactoryUtil.CONNECTOR; import static org.apache.flink.table.types.utils.TypeConversions.fromLogicalToDataType; import static org.apache.flink.table.utils.EncodingUtils.decodeBase64ToBytes; @@ -152,11 +144,18 @@ import 
static org.apache.paimon.flink.LogicalTypeConversion.toLogicalType; import static org.apache.paimon.flink.log.LogStoreRegister.registerLogSystem; import static org.apache.paimon.flink.log.LogStoreRegister.unRegisterLogSystem; +import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.SCHEMA; import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.compoundKey; import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.deserializeNonPhysicalColumn; import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.deserializeWatermarkSpec; import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.nonPhysicalColumnsCount; import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.serializeNewWatermarkSpec; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.COMMENT; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.NAME; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK_ROWTIME; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK_STRATEGY_DATA_TYPE; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK_STRATEGY_EXPR; import static org.apache.paimon.flink.utils.TableStatsUtil.createTableColumnStats; import static org.apache.paimon.flink.utils.TableStatsUtil.createTableStats; import static org.apache.paimon.utils.Preconditions.checkArgument; @@ -1008,18 +1007,18 @@ private static void validateAlterTable(CatalogBaseTable ct1, CatalogBaseTable ct } // materialized table is not resolved at this time. if (!table1IsMaterialized) { - org.apache.flink.table.api.TableSchema ts1 = ct1.getSchema(); - org.apache.flink.table.api.TableSchema ts2 = ct2.getSchema(); + org.apache.flink.table.api.Schema ts1 = ct1.getUnresolvedSchema(); + org.apache.flink.table.api.Schema ts2 = ct2.getUnresolvedSchema(); boolean pkEquality = false; if (ts1.getPrimaryKey().isPresent() && ts2.getPrimaryKey().isPresent()) { pkEquality = Objects.equals( - ts1.getPrimaryKey().get().getType(), - ts2.getPrimaryKey().get().getType()) + ts1.getPrimaryKey().get().getConstraintName(), + ts2.getPrimaryKey().get().getConstraintName()) && Objects.equals( - ts1.getPrimaryKey().get().getColumns(), - ts2.getPrimaryKey().get().getColumns()); + ts1.getPrimaryKey().get().getColumnNames(), + ts2.getPrimaryKey().get().getColumnNames()); } else if (!ts1.getPrimaryKey().isPresent() && !ts2.getPrimaryKey().isPresent()) { pkEquality = true; } @@ -1063,7 +1062,8 @@ public final void close() throws CatalogException { private CatalogBaseTable toCatalogTable(Table table) { Map newOptions = new HashMap<>(table.options()); - TableSchema.Builder builder = TableSchema.builder(); + org.apache.flink.table.api.Schema.Builder builder = + org.apache.flink.table.api.Schema.newBuilder(); Map nonPhysicalColumnComments = new HashMap<>(); // add columns @@ -1078,10 +1078,10 @@ private CatalogBaseTable toCatalogTable(Table table) { if (optionalName == null || physicalColumns.contains(optionalName)) { // build physical column from table row field RowType.RowField field = physicalRowFields.get(physicalColumnIndex++); - builder.field(field.getName(), fromLogicalToDataType(field.getType())); + builder.column(field.getName(), fromLogicalToDataType(field.getType())); } else { // build non-physical column from options - builder.add(deserializeNonPhysicalColumn(newOptions, i)); + 
deserializeNonPhysicalColumn(newOptions, i, builder); if (newOptions.containsKey(compoundKey(SCHEMA, i, COMMENT))) { nonPhysicalColumnComments.put( optionalName, newOptions.get(compoundKey(SCHEMA, i, COMMENT))); @@ -1093,22 +1093,18 @@ private CatalogBaseTable toCatalogTable(Table table) { // extract watermark information if (newOptions.keySet().stream() .anyMatch(key -> key.startsWith(compoundKey(SCHEMA, WATERMARK)))) { - builder.watermark(deserializeWatermarkSpec(newOptions)); + deserializeWatermarkSpec(newOptions, builder); } // add primary keys if (table.primaryKeys().size() > 0) { - builder.primaryKey( - table.primaryKeys().stream().collect(Collectors.joining("_", "PK_", "")), - table.primaryKeys().toArray(new String[0])); + builder.primaryKey(table.primaryKeys()); } - TableSchema schema = builder.build(); + org.apache.flink.table.api.Schema schema = builder.build(); // remove schema from options - DescriptorProperties removeProperties = new DescriptorProperties(false); - removeProperties.putTableSchema(SCHEMA, schema); - removeProperties.asMap().keySet().forEach(newOptions::remove); + FlinkDescriptorProperties.removeSchemaKeys(SCHEMA, schema, newOptions); Options options = Options.fromMap(newOptions); if (TableType.MATERIALIZED_TABLE == options.get(CoreOptions.TYPE)) { @@ -1124,7 +1120,10 @@ private CatalogBaseTable toCatalogTable(Table table) { } private CatalogMaterializedTable buildMaterializedTable( - Table table, Map newOptions, TableSchema schema, Options options) { + Table table, + Map newOptions, + org.apache.flink.table.api.Schema schema, + Options options) { String definitionQuery = options.get(MATERIALIZED_TABLE_DEFINITION_QUERY); IntervalFreshness freshness = IntervalFreshness.of( @@ -1148,7 +1147,7 @@ private CatalogMaterializedTable buildMaterializedTable( // remove materialized table related options allMaterializedTableAttributes().forEach(newOptions::remove); return CatalogMaterializedTable.newBuilder() - .schema(schema.toSchema()) + .schema(schema) .comment(table.comment().orElse("")) .partitionKeys(table.partitionKeys()) .options(newOptions) diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkGenericCatalog.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkGenericCatalog.java index 37bed2d0480f5..75af5917bb492 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkGenericCatalog.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/FlinkGenericCatalog.java @@ -48,7 +48,6 @@ import org.apache.flink.table.expressions.Expression; import org.apache.flink.table.factories.Factory; import org.apache.flink.table.factories.FunctionDefinitionFactory; -import org.apache.flink.table.factories.TableFactory; import org.apache.flink.table.procedures.Procedure; import java.util.List; @@ -86,11 +85,6 @@ public Optional getFactory() { new FlinkGenericTableFactory(paimon.getFactory().get(), flink.getFactory().get())); } - @Override - public Optional getTableFactory() { - return flink.getTableFactory(); - } - @Override public Optional getFunctionDefinitionFactory() { return flink.getFunctionDefinitionFactory(); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/SystemCatalogTable.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/SystemCatalogTable.java index d5d843d91bb10..f88a808713c24 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/SystemCatalogTable.java +++ 
b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/SystemCatalogTable.java @@ -22,7 +22,6 @@ import org.apache.paimon.table.system.AuditLogTable; import org.apache.flink.table.api.Schema; -import org.apache.flink.table.api.WatermarkSpec; import org.apache.flink.table.catalog.CatalogTable; import org.apache.flink.table.types.utils.TypeConversions; @@ -32,11 +31,11 @@ import java.util.Map; import java.util.Optional; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK; -import static org.apache.flink.table.descriptors.Schema.SCHEMA; import static org.apache.paimon.flink.LogicalTypeConversion.toLogicalType; +import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.SCHEMA; import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.compoundKey; import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.deserializeWatermarkSpec; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK; /** A {@link CatalogTable} to represent system table. */ public class SystemCatalogTable implements CatalogTable { @@ -60,11 +59,8 @@ public Schema getUnresolvedSchema() { Map newOptions = new HashMap<>(table.options()); if (newOptions.keySet().stream() .anyMatch(key -> key.startsWith(compoundKey(SCHEMA, WATERMARK)))) { - WatermarkSpec watermarkSpec = deserializeWatermarkSpec(newOptions); - return builder.watermark( - watermarkSpec.getRowtimeAttribute(), - watermarkSpec.getWatermarkExpr()) - .build(); + deserializeWatermarkSpec(newOptions, builder); + return builder.build(); } } return builder.build(); diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/FlinkCatalogPropertiesUtil.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/FlinkCatalogPropertiesUtil.java index b0f99a6e89e43..fa84a1ca070d0 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/FlinkCatalogPropertiesUtil.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/FlinkCatalogPropertiesUtil.java @@ -20,8 +20,7 @@ import org.apache.paimon.shade.guava30.com.google.common.collect.ImmutableSet; -import org.apache.flink.table.api.TableColumn; -import org.apache.flink.table.api.WatermarkSpec; +import org.apache.flink.table.api.Schema; import org.apache.flink.table.catalog.Column; import org.apache.flink.table.catalog.ResolvedSchema; import org.apache.flink.table.types.DataType; @@ -36,48 +35,23 @@ import java.util.stream.Collectors; import java.util.stream.Stream; -import static org.apache.flink.table.descriptors.DescriptorProperties.COMMENT; -import static org.apache.flink.table.descriptors.DescriptorProperties.DATA_TYPE; -import static org.apache.flink.table.descriptors.DescriptorProperties.EXPR; -import static org.apache.flink.table.descriptors.DescriptorProperties.METADATA; -import static org.apache.flink.table.descriptors.DescriptorProperties.NAME; -import static org.apache.flink.table.descriptors.DescriptorProperties.VIRTUAL; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK_ROWTIME; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK_STRATEGY_DATA_TYPE; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK_STRATEGY_EXPR; -import static org.apache.flink.table.descriptors.Schema.SCHEMA; +import static 
org.apache.paimon.flink.utils.FlinkDescriptorProperties.COMMENT; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.DATA_TYPE; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.EXPR; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.METADATA; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.NAME; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.VIRTUAL; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK_ROWTIME; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK_STRATEGY_DATA_TYPE; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK_STRATEGY_EXPR; /** * Utilities for ser/deserializing non-physical columns and watermark into/from a map of string * properties. */ public class FlinkCatalogPropertiesUtil { - - public static Map serializeNonPhysicalColumns( - Map indexMap, List nonPhysicalColumns) { - Map serialized = new HashMap<>(); - for (TableColumn c : nonPhysicalColumns) { - int index = indexMap.get(c.getName()); - serialized.put(compoundKey(SCHEMA, index, NAME), c.getName()); - serialized.put( - compoundKey(SCHEMA, index, DATA_TYPE), - c.getType().getLogicalType().asSerializableString()); - if (c instanceof TableColumn.ComputedColumn) { - TableColumn.ComputedColumn computedColumn = (TableColumn.ComputedColumn) c; - serialized.put(compoundKey(SCHEMA, index, EXPR), computedColumn.getExpression()); - } else { - TableColumn.MetadataColumn metadataColumn = (TableColumn.MetadataColumn) c; - serialized.put( - compoundKey(SCHEMA, index, METADATA), - metadataColumn.getMetadataAlias().orElse(metadataColumn.getName())); - serialized.put( - compoundKey(SCHEMA, index, VIRTUAL), - Boolean.toString(metadataColumn.isVirtual())); - } - } - return serialized; - } + public static final String SCHEMA = "schema"; /** Serialize non-physical columns of new api. 
*/ public static Map serializeNonPhysicalNewColumns(ResolvedSchema schema) { @@ -119,22 +93,6 @@ public static Map serializeNonPhysicalNewColumns(ResolvedSchema return serialized; } - public static Map serializeWatermarkSpec(WatermarkSpec watermarkSpec) { - Map serializedWatermarkSpec = new HashMap<>(); - String watermarkPrefix = compoundKey(SCHEMA, WATERMARK, 0); - serializedWatermarkSpec.put( - compoundKey(watermarkPrefix, WATERMARK_ROWTIME), - watermarkSpec.getRowtimeAttribute()); - serializedWatermarkSpec.put( - compoundKey(watermarkPrefix, WATERMARK_STRATEGY_EXPR), - watermarkSpec.getWatermarkExpr()); - serializedWatermarkSpec.put( - compoundKey(watermarkPrefix, WATERMARK_STRATEGY_DATA_TYPE), - watermarkSpec.getWatermarkExprOutputType().getLogicalType().asSerializableString()); - - return serializedWatermarkSpec; - } - public static Map serializeNewWatermarkSpec( org.apache.flink.table.catalog.WatermarkSpec watermarkSpec) { Map serializedWatermarkSpec = new HashMap<>(); @@ -219,7 +177,8 @@ private static boolean isColumnNameKey(String key) { && SCHEMA_COLUMN_NAME_SUFFIX.matcher(key.substring(SCHEMA.length() + 1)).matches(); } - public static TableColumn deserializeNonPhysicalColumn(Map options, int index) { + public static void deserializeNonPhysicalColumn( + Map options, int index, Schema.Builder builder) { String nameKey = compoundKey(SCHEMA, index, NAME); String dataTypeKey = compoundKey(SCHEMA, index, DATA_TYPE); String exprKey = compoundKey(SCHEMA, index, EXPR); @@ -227,45 +186,42 @@ public static TableColumn deserializeNonPhysicalColumn(Map optio String virtualKey = compoundKey(SCHEMA, index, VIRTUAL); String name = options.get(nameKey); - DataType dataType = - TypeConversions.fromLogicalToDataType( - LogicalTypeParser.parse(options.get(dataTypeKey))); - TableColumn column; if (options.containsKey(exprKey)) { - column = TableColumn.computed(name, dataType, options.get(exprKey)); + final String expr = options.get(exprKey); + builder.columnByExpression(name, expr); } else if (options.containsKey(metadataKey)) { String metadataAlias = options.get(metadataKey); boolean isVirtual = Boolean.parseBoolean(options.get(virtualKey)); - column = - metadataAlias.equals(name) - ? TableColumn.metadata(name, dataType, isVirtual) - : TableColumn.metadata(name, dataType, metadataAlias, isVirtual); + DataType dataType = + TypeConversions.fromLogicalToDataType( + LogicalTypeParser.parse( + options.get(dataTypeKey), + Thread.currentThread().getContextClassLoader())); + if (metadataAlias.equals(name)) { + builder.columnByMetadata(name, dataType, isVirtual); + } else { + builder.columnByMetadata(name, dataType, metadataAlias, isVirtual); + } } else { throw new RuntimeException( String.format( "Failed to build non-physical column. 
Current index is %s, options are %s", index, options)); } - - return column; } - public static WatermarkSpec deserializeWatermarkSpec(Map options) { + public static void deserializeWatermarkSpec( + Map options, Schema.Builder builder) { String watermarkPrefixKey = compoundKey(SCHEMA, WATERMARK); String rowtimeKey = compoundKey(watermarkPrefixKey, 0, WATERMARK_ROWTIME); String exprKey = compoundKey(watermarkPrefixKey, 0, WATERMARK_STRATEGY_EXPR); - String dataTypeKey = compoundKey(watermarkPrefixKey, 0, WATERMARK_STRATEGY_DATA_TYPE); String rowtimeAttribute = options.get(rowtimeKey); String watermarkExpressionString = options.get(exprKey); - DataType watermarkExprOutputType = - TypeConversions.fromLogicalToDataType( - LogicalTypeParser.parse(options.get(dataTypeKey))); - return new WatermarkSpec( - rowtimeAttribute, watermarkExpressionString, watermarkExprOutputType); + builder.watermark(rowtimeAttribute, watermarkExpressionString); } public static String compoundKey(Object... components) { diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/FlinkDescriptorProperties.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/FlinkDescriptorProperties.java new file mode 100644 index 0000000000000..edc73ca7bf41f --- /dev/null +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/utils/FlinkDescriptorProperties.java @@ -0,0 +1,99 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.flink.utils; + +import org.apache.flink.table.api.Schema; + +import java.util.Arrays; +import java.util.List; +import java.util.Map; + +import static org.apache.flink.util.Preconditions.checkNotNull; + +/** + * Utility class for having a unified string-based representation of Table API related classes such + * as Schema, TypeInformation, etc. + * + *
<p>
Note to implementers: Please try to reuse key names as much as possible. Key-names should be + * hierarchical and lower case. Use "-" instead of dots or camel case. E.g., + * connector.schema.start-from = from-earliest. Try not to use the higher level in a key-name. E.g., + * instead of connector.kafka.kafka-version use connector.kafka.version. + * + * <p>
    Properties with key normalization enabled contain only lower-case keys. + */ +public class FlinkDescriptorProperties { + + public static final String NAME = "name"; + + public static final String DATA_TYPE = "data-type"; + + public static final String EXPR = "expr"; + + public static final String METADATA = "metadata"; + + public static final String VIRTUAL = "virtual"; + + public static final String WATERMARK = "watermark"; + + public static final String WATERMARK_ROWTIME = "rowtime"; + + public static final String WATERMARK_STRATEGY = "strategy"; + + public static final String WATERMARK_STRATEGY_EXPR = WATERMARK_STRATEGY + '.' + EXPR; + + public static final String WATERMARK_STRATEGY_DATA_TYPE = WATERMARK_STRATEGY + '.' + DATA_TYPE; + + public static final String PRIMARY_KEY_NAME = "primary-key.name"; + + public static final String PRIMARY_KEY_COLUMNS = "primary-key.columns"; + + public static final String COMMENT = "comment"; + + public static void removeSchemaKeys(String key, Schema schema, Map options) { + checkNotNull(key); + checkNotNull(schema); + + List subKeys = Arrays.asList(NAME, DATA_TYPE, EXPR, METADATA, VIRTUAL); + for (int idx = 0; idx < schema.getColumns().size(); idx++) { + for (String subKey : subKeys) { + options.remove(key + '.' + idx + '.' + subKey); + } + } + + if (!schema.getWatermarkSpecs().isEmpty()) { + subKeys = + Arrays.asList( + WATERMARK_ROWTIME, + WATERMARK_STRATEGY_EXPR, + WATERMARK_STRATEGY_DATA_TYPE); + for (int idx = 0; idx < schema.getWatermarkSpecs().size(); idx++) { + for (String subKey : subKeys) { + options.remove(key + '.' + WATERMARK + '.' + idx + '.' + subKey); + } + } + } + + schema.getPrimaryKey() + .ifPresent( + pk -> { + options.remove(key + '.' + PRIMARY_KEY_NAME); + options.remove(key + '.' + PRIMARY_KEY_COLUMNS); + }); + } +} diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkCatalogPropertiesUtilTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkCatalogPropertiesUtilTest.java index 9268a236b6cb6..e32150b1fe822 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkCatalogPropertiesUtilTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkCatalogPropertiesUtilTest.java @@ -21,27 +21,35 @@ import org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil; import org.apache.flink.table.api.DataTypes; -import org.apache.flink.table.api.TableColumn; -import org.apache.flink.table.api.WatermarkSpec; +import org.apache.flink.table.api.Schema; +import org.apache.flink.table.catalog.Column; +import org.apache.flink.table.catalog.ResolvedSchema; +import org.apache.flink.table.catalog.WatermarkSpec; +import org.apache.flink.table.expressions.Expression; +import org.apache.flink.table.expressions.ExpressionVisitor; +import org.apache.flink.table.expressions.ResolvedExpression; +import org.apache.flink.table.expressions.SqlCallExpression; +import org.apache.flink.table.types.DataType; import org.junit.jupiter.api.Test; import java.util.ArrayList; import java.util.Arrays; +import java.util.Collections; import java.util.HashMap; import java.util.List; import java.util.Map; -import static org.apache.flink.table.descriptors.DescriptorProperties.DATA_TYPE; -import static org.apache.flink.table.descriptors.DescriptorProperties.EXPR; -import static org.apache.flink.table.descriptors.DescriptorProperties.METADATA; -import static org.apache.flink.table.descriptors.DescriptorProperties.NAME; -import static 
org.apache.flink.table.descriptors.DescriptorProperties.VIRTUAL; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK_ROWTIME; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK_STRATEGY_DATA_TYPE; -import static org.apache.flink.table.descriptors.DescriptorProperties.WATERMARK_STRATEGY_EXPR; -import static org.apache.flink.table.descriptors.Schema.SCHEMA; +import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.SCHEMA; import static org.apache.paimon.flink.utils.FlinkCatalogPropertiesUtil.compoundKey; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.DATA_TYPE; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.EXPR; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.METADATA; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.NAME; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.VIRTUAL; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK_ROWTIME; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK_STRATEGY_DATA_TYPE; +import static org.apache.paimon.flink.utils.FlinkDescriptorProperties.WATERMARK_STRATEGY_EXPR; import static org.assertj.core.api.Assertions.assertThat; /** Test for {@link FlinkCatalogPropertiesUtil}. */ @@ -49,18 +57,27 @@ public class FlinkCatalogPropertiesUtilTest { @Test public void testSerDeNonPhysicalColumns() { - Map indexMap = new HashMap<>(); - indexMap.put("comp", 2); - indexMap.put("meta1", 3); - indexMap.put("meta2", 5); - List columns = new ArrayList<>(); - columns.add(TableColumn.computed("comp", DataTypes.INT(), "`k` * 2")); - columns.add(TableColumn.metadata("meta1", DataTypes.VARCHAR(10))); - columns.add(TableColumn.metadata("meta2", DataTypes.BIGINT().notNull(), "price", true)); + List columns = new ArrayList<>(); + columns.add(new Schema.UnresolvedComputedColumn("comp", new SqlCallExpression("`k` * 2"))); + columns.add( + new Schema.UnresolvedMetadataColumn("meta1", DataTypes.VARCHAR(10), null, false)); + columns.add( + new Schema.UnresolvedMetadataColumn( + "meta2", DataTypes.BIGINT().notNull(), "price", true, null)); + + List resolvedColumns = new ArrayList<>(); + resolvedColumns.add(Column.physical("phy1", DataTypes.INT())); + resolvedColumns.add(Column.physical("phy2", DataTypes.INT())); + resolvedColumns.add( + Column.computed("comp", new TestResolvedExpression("`k` * 2", DataTypes.INT()))); + resolvedColumns.add(Column.metadata("meta1", DataTypes.VARCHAR(10), null, false)); + resolvedColumns.add(Column.physical("phy3", DataTypes.INT())); + resolvedColumns.add(Column.metadata("meta2", DataTypes.BIGINT().notNull(), "price", true)); // validate serialization Map serialized = - FlinkCatalogPropertiesUtil.serializeNonPhysicalColumns(indexMap, columns); + FlinkCatalogPropertiesUtil.serializeNonPhysicalNewColumns( + new ResolvedSchema(resolvedColumns, Collections.emptyList(), null)); Map expected = new HashMap<>(); expected.put(compoundKey(SCHEMA, 2, NAME), "comp"); @@ -80,27 +97,26 @@ public void testSerDeNonPhysicalColumns() { assertThat(serialized).containsExactlyInAnyOrderEntriesOf(expected); // validate deserialization - List deserialized = new ArrayList<>(); - deserialized.add(FlinkCatalogPropertiesUtil.deserializeNonPhysicalColumn(serialized, 2)); - 
deserialized.add(FlinkCatalogPropertiesUtil.deserializeNonPhysicalColumn(serialized, 3)); - deserialized.add(FlinkCatalogPropertiesUtil.deserializeNonPhysicalColumn(serialized, 5)); + Schema.Builder builder = Schema.newBuilder(); + FlinkCatalogPropertiesUtil.deserializeNonPhysicalColumn(serialized, 2, builder); + FlinkCatalogPropertiesUtil.deserializeNonPhysicalColumn(serialized, 3, builder); + FlinkCatalogPropertiesUtil.deserializeNonPhysicalColumn(serialized, 5, builder); - assertThat(deserialized).isEqualTo(columns); - - // validate that + assertThat(builder.build().getColumns()) + .containsExactly(columns.toArray(new Schema.UnresolvedColumn[0])); } @Test public void testSerDeWatermarkSpec() { WatermarkSpec watermarkSpec = - new WatermarkSpec( + WatermarkSpec.of( "test_time", - "`test_time` - INTERVAL '0.001' SECOND", - DataTypes.TIMESTAMP(3)); + new TestResolvedExpression( + "`test_time` - INTERVAL '0.001' SECOND", DataTypes.TIMESTAMP(3))); // validate serialization Map serialized = - FlinkCatalogPropertiesUtil.serializeWatermarkSpec(watermarkSpec); + FlinkCatalogPropertiesUtil.serializeNewWatermarkSpec(watermarkSpec); Map expected = new HashMap<>(); String watermarkPrefix = compoundKey(SCHEMA, WATERMARK, 0); @@ -113,9 +129,13 @@ public void testSerDeWatermarkSpec() { assertThat(serialized).containsExactlyInAnyOrderEntriesOf(expected); // validate serialization - WatermarkSpec deserialized = - FlinkCatalogPropertiesUtil.deserializeWatermarkSpec(serialized); - assertThat(deserialized).isEqualTo(watermarkSpec); + Schema.Builder builder = Schema.newBuilder(); + FlinkCatalogPropertiesUtil.deserializeWatermarkSpec(serialized, builder); + assertThat(builder.build().getWatermarkSpecs()).hasSize(1); + Schema.UnresolvedWatermarkSpec actual = builder.build().getWatermarkSpecs().get(0); + assertThat(actual.getColumnName()).isEqualTo(watermarkSpec.getRowtimeAttribute()); + assertThat(actual.getWatermarkExpression().asSummaryString()) + .isEqualTo(watermarkSpec.getWatermarkExpression().asSummaryString()); } @Test @@ -150,4 +170,44 @@ public void testNonPhysicalColumnsCount() { oldStyleOptions, Arrays.asList("phy1", "phy2"))) .isEqualTo(3); } + + private static class TestResolvedExpression implements ResolvedExpression { + private final String name; + private final DataType outputDataType; + + private TestResolvedExpression(String name, DataType outputDataType) { + this.name = name; + this.outputDataType = outputDataType; + } + + @Override + public DataType getOutputDataType() { + return outputDataType; + } + + @Override + public List getResolvedChildren() { + return Collections.emptyList(); + } + + @Override + public String asSummaryString() { + return new SqlCallExpression(name).asSummaryString(); + } + + @Override + public String asSerializableString() { + return name; + } + + @Override + public List getChildren() { + return Collections.emptyList(); + } + + @Override + public R accept(ExpressionVisitor expressionVisitor) { + return null; + } + } } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkCatalogTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkCatalogTest.java index 27a89510975f3..e4286eb18172d 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkCatalogTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/FlinkCatalogTest.java @@ -850,7 +850,7 @@ private static void checkEquals(CatalogBaseTable t1, CatalogBaseTable t2) { 
assertThat(t2.getComment()).isEqualTo(t1.getComment()); assertThat(t2.getOptions()).isEqualTo(t1.getOptions()); if (t1.getTableKind() == CatalogBaseTable.TableKind.TABLE) { - assertThat(t2.getSchema()).isEqualTo(t1.getSchema()); + assertThat(t2.getUnresolvedSchema()).isEqualTo(t1.getUnresolvedSchema()); assertThat(((CatalogTable) (t2)).getPartitionKeys()) .isEqualTo(((CatalogTable) (t1)).getPartitionKeys()); assertThat(((CatalogTable) (t2)).isPartitioned()) @@ -864,7 +864,12 @@ private static void checkEquals(CatalogBaseTable t1, CatalogBaseTable t2) { t2.getUnresolvedSchema() .resolve(new TestSchemaResolver())) .build()) - .isEqualTo(t1.getSchema().toSchema()); + .isEqualTo( + Schema.newBuilder() + .fromResolvedSchema( + t1.getUnresolvedSchema() + .resolve(new TestSchemaResolver())) + .build()); assertThat(mt2.getPartitionKeys()).isEqualTo(mt1.getPartitionKeys()); assertThat(mt2.isPartitioned()).isEqualTo(mt1.isPartitioned()); // validate definition query From 3c820828062abef86b278f5a0334b6e65570c54b Mon Sep 17 00:00:00 2001 From: WenjunMin Date: Mon, 2 Dec 2024 21:42:22 +0800 Subject: [PATCH 095/157] [core] Make default of 'lookup.local-file-type' to sort (#4622) --- docs/layouts/shortcodes/generated/core_configuration.html | 2 +- .../paimon/benchmark/lookup/AbstractLookupBenchmark.java | 5 ++++- .../paimon/benchmark/lookup/LookupReaderBenchmark.java | 2 +- .../src/main/java/org/apache/paimon/CoreOptions.java | 2 +- .../main/java/org/apache/paimon/io/cache/CacheBuilder.java | 4 ++++ 5 files changed, 11 insertions(+), 4 deletions(-) diff --git a/docs/layouts/shortcodes/generated/core_configuration.html b/docs/layouts/shortcodes/generated/core_configuration.html index fad1f4907e5a9..2ad5db28b9ba1 100644 --- a/docs/layouts/shortcodes/generated/core_configuration.html +++ b/docs/layouts/shortcodes/generated/core_configuration.html @@ -443,7 +443,7 @@
        <tr>
            <td><h5>lookup.local-file-type</h5></td>
-            <td style="word-wrap: break-word;">hash</td>
+            <td style="word-wrap: break-word;">sort</td>
            <td><p>Enum</p></td>
            <td>The local file type for lookup.<br /><br />Possible values:<ul><li>"sort": Construct a sorted file for lookup.</li><li>"hash": Construct a hash file for lookup.</li></ul></td>
        </tr>
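Since the generated table above only records the new `sort` default, here is a minimal sketch of pinning the previous behavior explicitly; the table definition is illustrative and only `'lookup.local-file-type'` is relevant to this change:

```sql
-- Keep the pre-change hash-based local lookup files instead of the new 'sort' default.
CREATE TABLE t (
    k INT,
    v STRING,
    PRIMARY KEY (k) NOT ENFORCED
) WITH (
    'lookup.local-file-type' = 'hash'
);
```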
    diff --git a/paimon-benchmark/paimon-micro-benchmarks/src/test/java/org/apache/paimon/benchmark/lookup/AbstractLookupBenchmark.java b/paimon-benchmark/paimon-micro-benchmarks/src/test/java/org/apache/paimon/benchmark/lookup/AbstractLookupBenchmark.java index 635d876f7a985..653bfee6cc00f 100644 --- a/paimon-benchmark/paimon-micro-benchmarks/src/test/java/org/apache/paimon/benchmark/lookup/AbstractLookupBenchmark.java +++ b/paimon-benchmark/paimon-micro-benchmarks/src/test/java/org/apache/paimon/benchmark/lookup/AbstractLookupBenchmark.java @@ -102,7 +102,10 @@ protected Pair writeData( new CacheManager(MemorySize.ofMebiBytes(10)), keySerializer.createSliceComparator()); - File file = new File(tempDir.toFile(), UUID.randomUUID().toString()); + String name = + String.format( + "%s-%s-%s", options.lookupLocalFileType(), valueLength, bloomFilterEnabled); + File file = new File(tempDir.toFile(), UUID.randomUUID() + "-" + name); LookupStoreWriter writer = factory.createWriter(file, createBloomFiler(bloomFilterEnabled)); int i = 0; for (byte[] input : inputs) { diff --git a/paimon-benchmark/paimon-micro-benchmarks/src/test/java/org/apache/paimon/benchmark/lookup/LookupReaderBenchmark.java b/paimon-benchmark/paimon-micro-benchmarks/src/test/java/org/apache/paimon/benchmark/lookup/LookupReaderBenchmark.java index 9947b54a70f0c..2d8de84327d46 100644 --- a/paimon-benchmark/paimon-micro-benchmarks/src/test/java/org/apache/paimon/benchmark/lookup/LookupReaderBenchmark.java +++ b/paimon-benchmark/paimon-micro-benchmarks/src/test/java/org/apache/paimon/benchmark/lookup/LookupReaderBenchmark.java @@ -128,7 +128,7 @@ private void readData( LookupStoreFactory factory = LookupStoreFactory.create( options, - new CacheManager(MemorySize.ofMebiBytes(10)), + new CacheManager(MemorySize.ofMebiBytes(20), 0.5), new RowCompactedSerializer(RowType.of(new IntType())) .createSliceComparator()); diff --git a/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java b/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java index b9b5675f1d2d5..cddef33c276e5 100644 --- a/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java +++ b/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java @@ -891,7 +891,7 @@ public class CoreOptions implements Serializable { public static final ConfigOption LOOKUP_LOCAL_FILE_TYPE = key("lookup.local-file-type") .enumType(LookupLocalFileType.class) - .defaultValue(LookupLocalFileType.HASH) + .defaultValue(LookupLocalFileType.SORT) .withDescription("The local file type for lookup."); public static final ConfigOption LOOKUP_HASH_LOAD_FACTOR = diff --git a/paimon-common/src/main/java/org/apache/paimon/io/cache/CacheBuilder.java b/paimon-common/src/main/java/org/apache/paimon/io/cache/CacheBuilder.java index 4660343d45e1e..402f21f06264d 100644 --- a/paimon-common/src/main/java/org/apache/paimon/io/cache/CacheBuilder.java +++ b/paimon-common/src/main/java/org/apache/paimon/io/cache/CacheBuilder.java @@ -72,6 +72,10 @@ public Cache build() { org.apache.paimon.shade.guava30.com.google.common.cache.CacheBuilder .newBuilder() .weigher(CacheBuilder::weigh) + // The concurrency level determines the number of segment caches in + // Guava,limiting the maximum block entries held in cache. Since we do + // not access this cache concurrently, it is set to 1. 
+ .concurrencyLevel(1) .maximumWeight(memorySize.getBytes()) .removalListener(this::onRemoval) .build()); From 039046a0d4d4aa4195f9187b2d0214f277316ce8 Mon Sep 17 00:00:00 2001 From: Jingsong Date: Mon, 2 Dec 2024 22:52:10 +0800 Subject: [PATCH 096/157] [core] Extract decompressBlock method in SortLookupStoreReader --- .../lookup/sort/SortLookupStoreReader.java | 65 +++++++++---------- 1 file changed, 32 insertions(+), 33 deletions(-) diff --git a/paimon-common/src/main/java/org/apache/paimon/lookup/sort/SortLookupStoreReader.java b/paimon-common/src/main/java/org/apache/paimon/lookup/sort/SortLookupStoreReader.java index 39997888ce92f..6dbfe130e3bb0 100644 --- a/paimon-common/src/main/java/org/apache/paimon/lookup/sort/SortLookupStoreReader.java +++ b/paimon-common/src/main/java/org/apache/paimon/lookup/sort/SortLookupStoreReader.java @@ -106,7 +106,7 @@ public byte[] lookup(byte[] key) throws IOException { return null; } - private BlockIterator getNextBlock() throws IOException { + private BlockIterator getNextBlock() { // index block handle, point to the key, value position. MemorySlice blockHandle = indexBlockIterator.next().getValue(); BlockReader dataBlock = @@ -134,42 +134,41 @@ private BlockReader readBlock(BlockHandle blockHandle, boolean index) { blockCache.getBlock( blockHandle.offset(), blockHandle.size(), - bytes -> { - MemorySegment block = MemorySegment.wrap(bytes); - int crc32cCode = crc32c(block, blockTrailer.getCompressionType()); - checkArgument( - blockTrailer.getCrc32c() == crc32cCode, - String.format( - "Expected CRC32C(%d) but found CRC32C(%d) for file(%s)", - blockTrailer.getCrc32c(), crc32cCode, filePath)); - - // decompress data - BlockCompressionFactory compressionFactory = - BlockCompressionFactory.create( - blockTrailer.getCompressionType()); - if (compressionFactory == null) { - return bytes; - } else { - MemorySliceInput compressedInput = - MemorySlice.wrap(block).toInput(); - byte[] uncompressed = new byte[compressedInput.readVarLenInt()]; - BlockDecompressor decompressor = - compressionFactory.getDecompressor(); - int uncompressedLength = - decompressor.decompress( - block.getHeapMemory(), - compressedInput.position(), - compressedInput.available(), - uncompressed, - 0); - checkArgument(uncompressedLength == uncompressed.length); - return uncompressed; - } - }, + bytes -> decompressBlock(bytes, blockTrailer), index); return new BlockReader(MemorySlice.wrap(unCompressedBlock), comparator); } + private byte[] decompressBlock(byte[] compressedBytes, BlockTrailer blockTrailer) { + MemorySegment compressed = MemorySegment.wrap(compressedBytes); + int crc32cCode = crc32c(compressed, blockTrailer.getCompressionType()); + checkArgument( + blockTrailer.getCrc32c() == crc32cCode, + String.format( + "Expected CRC32C(%d) but found CRC32C(%d) for file(%s)", + blockTrailer.getCrc32c(), crc32cCode, filePath)); + + // decompress data + BlockCompressionFactory compressionFactory = + BlockCompressionFactory.create(blockTrailer.getCompressionType()); + if (compressionFactory == null) { + return compressedBytes; + } else { + MemorySliceInput compressedInput = MemorySlice.wrap(compressed).toInput(); + byte[] uncompressed = new byte[compressedInput.readVarLenInt()]; + BlockDecompressor decompressor = compressionFactory.getDecompressor(); + int uncompressedLength = + decompressor.decompress( + compressed.getHeapMemory(), + compressedInput.position(), + compressedInput.available(), + uncompressed, + 0); + checkArgument(uncompressedLength == uncompressed.length); + return 
uncompressed; + } + } + @Override public void close() throws IOException { if (bloomFilter != null) { From 300cc67c208c4b86e2edf58ad1981b86649fe892 Mon Sep 17 00:00:00 2001 From: Yann Byron Date: Tue, 3 Dec 2024 11:35:16 +0800 Subject: [PATCH 097/157] [spark] show table extended (#4603) * [spark] show table extended * update * [update] doc --- docs/content/spark/auxiliary.md | 11 ++ .../spark/PaimonPartitionManagement.scala | 2 +- .../analysis/PaimonResolvePartitionSpec.scala | 75 +++++++++++ .../PaimonSparkSessionExtensions.scala | 2 + .../org/apache/spark/sql/PaimonUtils.scala | 19 +++ .../catalog/PaimonCatalogImplicits.scala | 30 +++++ .../catalog/PaimonCatalogUtils.scala | 3 + .../spark/sql/paimon/shims/SparkShim.scala | 4 + .../paimon/spark/sql/DescribeTableTest.scala | 70 ++++++++++ .../analysis/Spark3ResolutionRules.scala | 56 ++++++++ .../PaimonShowTablePartitionCommand.scala | 96 ++++++++++++++ .../PaimonShowTablesExtendedCommand.scala | 123 ++++++++++++++++++ .../spark/sql/paimon/shims/Spark3Shim.scala | 8 +- .../analysis/Spark4ResolutionRules.scala | 27 ++++ .../spark/sql/paimon/shims/Spark4Shim.scala | 9 +- 15 files changed, 532 insertions(+), 3 deletions(-) create mode 100644 paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/PaimonResolvePartitionSpec.scala create mode 100644 paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogImplicits.scala create mode 100644 paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/Spark3ResolutionRules.scala create mode 100644 paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/commands/PaimonShowTablePartitionCommand.scala create mode 100644 paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/commands/PaimonShowTablesExtendedCommand.scala create mode 100644 paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/Spark4ResolutionRules.scala diff --git a/docs/content/spark/auxiliary.md b/docs/content/spark/auxiliary.md index 6330ca27ce312..5de0289565f2f 100644 --- a/docs/content/spark/auxiliary.md +++ b/docs/content/spark/auxiliary.md @@ -96,6 +96,17 @@ SHOW PARTITIONS my_table; SHOW PARTITIONS my_table PARTITION (dt=20230817); ``` +## Show Table Extended +The SHOW TABLE EXTENDED statement is used to list table or partition information. + +```sql +-- Lists tables that satisfy regular expressions +SHOW TABLE EXTENDED IN db_name LIKE 'test*'; + +-- Lists the specified partition information for the table +SHOW TABLE EXTENDED IN db_name LIKE 'table_name' PARTITION(pt = '2024'); +``` + ## Analyze table The ANALYZE TABLE statement collects statistics about the table, that are to be used by the query optimizer to find a better query execution plan. 
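The `Analyze table` section shown as context above only states what the statement does; a minimal sketch of typical invocations, with `my_table` as a placeholder name:

```sql
-- Collect table-level statistics used by the query optimizer.
ANALYZE TABLE my_table COMPUTE STATISTICS;

-- Also collect column-level statistics, either for all columns or a chosen subset.
ANALYZE TABLE my_table COMPUTE STATISTICS FOR ALL COLUMNS;
```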
diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionManagement.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionManagement.scala index 9a305ca59a0f1..840f1341a69d7 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionManagement.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonPartitionManagement.scala @@ -100,7 +100,7 @@ trait PaimonPartitionManagement extends SupportsAtomicPartitionManagement { } override def loadPartitionMetadata(ident: InternalRow): JMap[String, String] = { - throw new UnsupportedOperationException("Load partition is not supported") + Map.empty[String, String].asJava } override def listPartitionIdentifiers( diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/PaimonResolvePartitionSpec.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/PaimonResolvePartitionSpec.scala new file mode 100644 index 0000000000000..5d6a5a063c06d --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/PaimonResolvePartitionSpec.scala @@ -0,0 +1,75 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.spark.catalyst.analysis + +import org.apache.spark.sql.PaimonUtils.{normalizePartitionSpec, requireExactMatchedPartitionSpec} +import org.apache.spark.sql.catalyst.InternalRow +import org.apache.spark.sql.catalyst.analysis.{PartitionSpec, ResolvedPartitionSpec, UnresolvedPartitionSpec} +import org.apache.spark.sql.catalyst.analysis.ResolvePartitionSpec.conf +import org.apache.spark.sql.catalyst.catalog.CatalogTypes.TablePartitionSpec +import org.apache.spark.sql.catalyst.expressions.{Cast, Literal} +import org.apache.spark.sql.catalyst.util.CharVarcharUtils +import org.apache.spark.sql.connector.catalog.{Identifier, TableCatalog} +import org.apache.spark.sql.execution.datasources.v2.DataSourceV2Implicits._ +import org.apache.spark.sql.types.{StringType, StructField, StructType} + +object PaimonResolvePartitionSpec { + + def resolve( + catalog: TableCatalog, + tableIndent: Identifier, + partitionSpec: PartitionSpec): ResolvedPartitionSpec = { + val table = catalog.loadTable(tableIndent).asPartitionable + partitionSpec match { + case u: UnresolvedPartitionSpec => + val partitionSchema = table.partitionSchema() + resolvePartitionSpec(table.name(), u, partitionSchema, allowPartitionSpec = false) + case o => o.asInstanceOf[ResolvedPartitionSpec] + } + } + + private def resolvePartitionSpec( + tableName: String, + partSpec: UnresolvedPartitionSpec, + partSchema: StructType, + allowPartitionSpec: Boolean): ResolvedPartitionSpec = { + val normalizedSpec = normalizePartitionSpec(partSpec.spec, partSchema, tableName, conf.resolver) + if (!allowPartitionSpec) { + requireExactMatchedPartitionSpec(tableName, normalizedSpec, partSchema.fieldNames) + } + val partitionNames = normalizedSpec.keySet + val requestedFields = partSchema.filter(field => partitionNames.contains(field.name)) + ResolvedPartitionSpec( + requestedFields.map(_.name), + convertToPartIdent(normalizedSpec, requestedFields), + partSpec.location) + } + + def convertToPartIdent( + partitionSpec: TablePartitionSpec, + schema: Seq[StructField]): InternalRow = { + val partValues = schema.map { + part => + val raw = partitionSpec.get(part.name).orNull + val dt = CharVarcharUtils.replaceCharVarcharWithString(part.dataType) + Cast(Literal.create(raw, StringType), dt, Some(conf.sessionLocalTimeZone)).eval() + } + InternalRow.fromSeq(partValues) + } +} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala index e8f75d394a818..f73df64fb8ab6 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/extensions/PaimonSparkSessionExtensions.scala @@ -40,6 +40,8 @@ class PaimonSparkSessionExtensions extends (SparkSessionExtensions => Unit) { extensions.injectResolutionRule(spark => new PaimonAnalysis(spark)) extensions.injectResolutionRule(spark => PaimonProcedureResolver(spark)) extensions.injectResolutionRule(spark => PaimonViewResolver(spark)) + extensions.injectResolutionRule( + spark => SparkShimLoader.getSparkShim.createCustomResolution(spark)) extensions.injectResolutionRule(spark => PaimonIncompatibleResolutionRules(spark)) extensions.injectPostHocResolutionRule(spark => PaimonPostHocResolutionRules(spark)) diff --git 
a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/PaimonUtils.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/PaimonUtils.scala index 4492d856ad509..cc49e787dc81c 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/PaimonUtils.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/PaimonUtils.scala @@ -20,11 +20,15 @@ package org.apache.spark.sql import org.apache.spark.executor.OutputMetrics import org.apache.spark.rdd.InputFileBlockHolder +import org.apache.spark.sql.catalyst.analysis.Resolver +import org.apache.spark.sql.catalyst.catalog.CatalogTypes.TablePartitionSpec import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression} import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan import org.apache.spark.sql.connector.expressions.{FieldReference, NamedReference} import org.apache.spark.sql.execution.datasources.DataSourceStrategy import org.apache.spark.sql.sources.Filter +import org.apache.spark.sql.types.StructType +import org.apache.spark.sql.util.PartitioningUtils import org.apache.spark.util.{Utils => SparkUtils} /** @@ -87,4 +91,19 @@ object PaimonUtils { outputMetrics.setBytesWritten(bytesWritten) outputMetrics.setRecordsWritten(recordsWritten) } + + def normalizePartitionSpec[T]( + partitionSpec: Map[String, T], + partCols: StructType, + tblName: String, + resolver: Resolver): Map[String, T] = { + PartitioningUtils.normalizePartitionSpec(partitionSpec, partCols, tblName, resolver) + } + + def requireExactMatchedPartitionSpec( + tableName: String, + spec: TablePartitionSpec, + partitionColumnNames: Seq[String]): Unit = { + PartitioningUtils.requireExactMatchedPartitionSpec(tableName, spec, partitionColumnNames) + } } diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogImplicits.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogImplicits.scala new file mode 100644 index 0000000000000..f1f20fb6fb31d --- /dev/null +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogImplicits.scala @@ -0,0 +1,30 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.spark.sql.connector.catalog + +object PaimonCatalogImplicits { + + import CatalogV2Implicits._ + + implicit class PaimonCatalogHelper(plugin: CatalogPlugin) extends CatalogHelper(plugin) + + implicit class PaimonNamespaceHelper(namespace: Array[String]) extends NamespaceHelper(namespace) + +// implicit class PaimonTableHelper(table: Table) extends TableHelper(table) +} diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogUtils.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogUtils.scala index 2ab3dc4945245..5db6894ba093b 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogUtils.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/connector/catalog/PaimonCatalogUtils.scala @@ -22,6 +22,7 @@ import org.apache.hadoop.conf.Configuration import org.apache.spark.SparkConf import org.apache.spark.sql.SparkSession import org.apache.spark.sql.catalyst.catalog.ExternalCatalog +import org.apache.spark.sql.connector.catalog.CatalogV2Util import org.apache.spark.sql.internal.StaticSQLConf.CATALOG_IMPLEMENTATION import org.apache.spark.sql.paimon.ReflectUtils @@ -40,4 +41,6 @@ object PaimonCatalogUtils { hadoopConf) } + val TABLE_RESERVED_PROPERTIES: Seq[String] = CatalogV2Util.TABLE_RESERVED_PROPERTIES + } diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShim.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShim.scala index bd85282737e99..334bd6e93180e 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShim.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/spark/sql/paimon/shims/SparkShim.scala @@ -24,6 +24,8 @@ import org.apache.paimon.types.{DataType, RowType} import org.apache.spark.sql.{Column, SparkSession} import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression} import org.apache.spark.sql.catalyst.parser.ParserInterface +import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan +import org.apache.spark.sql.catalyst.rules.Rule import org.apache.spark.sql.connector.catalog.{Identifier, Table, TableCatalog} import org.apache.spark.sql.connector.expressions.Transform import org.apache.spark.sql.types.StructType @@ -39,6 +41,8 @@ trait SparkShim { def createSparkParser(delegate: ParserInterface): ParserInterface + def createCustomResolution(spark: SparkSession): Rule[LogicalPlan] + def createSparkInternalRow(rowType: RowType): SparkInternalRow def createSparkArrayData(elementType: DataType): SparkArrayData diff --git a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DescribeTableTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DescribeTableTest.scala index 528dcd3cd107a..ae538fa48c4e2 100644 --- a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DescribeTableTest.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DescribeTableTest.scala @@ -27,6 +27,76 @@ import java.util.Objects class DescribeTableTest extends PaimonSparkTestBase { + test("Paimon show: show table extended") { + val testDB = "test_show" + withDatabase(testDB) { + spark.sql("CREATE TABLE s1 (id INT)") + + spark.sql(s"CREATE DATABASE $testDB") + spark.sql(s"USE $testDB") + spark.sql("CREATE TABLE s2 (id 
INT, pt STRING) PARTITIONED BY (pt)") + spark.sql("CREATE TABLE s3 (id INT, pt1 STRING, pt2 STRING) PARTITIONED BY (pt1, pt2)") + + spark.sql("INSERT INTO s2 VALUES (1, '2024'), (2, '2024'), (3, '2025'), (4, '2026')") + spark.sql(""" + |INSERT INTO s3 + |VALUES + |(1, '2024', '11'), (2, '2024', '12'), (3, '2025', '11'), (4, '2025', '12') + |""".stripMargin) + + // SHOW TABL EXTENDED will give four columns: namespace, tableName, isTemporary, information. + checkAnswer( + sql(s"SHOW TABLE EXTENDED IN $dbName0 LIKE '*'") + .select("namespace", "tableName", "isTemporary"), + Row("test", "s1", false)) + checkAnswer( + sql(s"SHOW TABLE EXTENDED IN $testDB LIKE '*'") + .select("namespace", "tableName", "isTemporary"), + Row(testDB, "s2", false) :: Row(testDB, "s3", false) :: Nil + ) + + // check table s1 + val res1 = spark.sql(s"SHOW TABLE EXTENDED IN $testDB LIKE 's2'").select("information") + Assertions.assertEquals(1, res1.count()) + val information1 = res1 + .collect() + .head + .getString(0) + .split("\n") + .map { + line => + val kv = line.split(": ", 2) + kv(0) -> kv(1) + } + .toMap + Assertions.assertEquals(information1("Catalog"), "paimon") + Assertions.assertEquals(information1("Namespace"), testDB) + Assertions.assertEquals(information1("Table"), "s2") + Assertions.assertEquals(information1("Provider"), "paimon") + Assertions.assertEquals(information1("Location"), loadTable(testDB, "s2").location().toString) + + // check table s2 partition info + val error1 = intercept[Exception] { + spark.sql(s"SHOW TABLE EXTENDED IN $testDB LIKE 's2' PARTITION(pt='2022')") + }.getMessage + assert(error1.contains("PARTITIONS_NOT_FOUND")) + + val error2 = intercept[Exception] { + spark.sql(s"SHOW TABLE EXTENDED IN $testDB LIKE 's3' PARTITION(pt1='2024')") + }.getMessage + assert(error2.contains("Partition spec is invalid")) + + val res2 = + spark.sql(s"SHOW TABLE EXTENDED IN $testDB LIKE 's3' PARTITION(pt1 = '2024', pt2 = 11)") + checkAnswer( + res2.select("namespace", "tableName", "isTemporary"), + Row(testDB, "s3", false) + ) + Assertions.assertTrue( + res2.select("information").collect().head.getString(0).contains("Partition Values")) + } + } + test(s"Paimon describe: describe table comment") { var comment = "test comment" spark.sql(s""" diff --git a/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/Spark3ResolutionRules.scala b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/Spark3ResolutionRules.scala new file mode 100644 index 0000000000000..924df2d1e3206 --- /dev/null +++ b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/Spark3ResolutionRules.scala @@ -0,0 +1,56 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.spark.catalyst.analysis + +import org.apache.paimon.spark.commands.{PaimonShowTablePartitionCommand, PaimonShowTablesExtendedCommand} + +import org.apache.spark.sql.SparkSession +import org.apache.spark.sql.catalyst.SQLConfHelper +import org.apache.spark.sql.catalyst.analysis.{PartitionSpec, ResolvedNamespace, UnresolvedPartitionSpec} +import org.apache.spark.sql.catalyst.plans.logical.{LogicalPlan, ShowTableExtended} +import org.apache.spark.sql.catalyst.rules.Rule +import org.apache.spark.sql.connector.catalog.Identifier + +case class Spark3ResolutionRules(session: SparkSession) + extends Rule[LogicalPlan] + with SQLConfHelper { + + import org.apache.spark.sql.connector.catalog.PaimonCatalogImplicits._ + + override def apply(plan: LogicalPlan): LogicalPlan = plan.resolveOperatorsDown { + case ShowTableExtended( + ResolvedNamespace(catalog, ns), + pattern, + partitionSpec @ (None | Some(UnresolvedPartitionSpec(_, _))), + output) => + partitionSpec + .map { + spec: PartitionSpec => + val table = Identifier.of(ns.toArray, pattern) + val resolvedSpec = + PaimonResolvePartitionSpec.resolve(catalog.asTableCatalog, table, spec) + PaimonShowTablePartitionCommand(output, catalog.asTableCatalog, table, resolvedSpec) + } + .getOrElse { + PaimonShowTablesExtendedCommand(catalog.asTableCatalog, ns, pattern, output) + } + + } + +} diff --git a/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/commands/PaimonShowTablePartitionCommand.scala b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/commands/PaimonShowTablePartitionCommand.scala new file mode 100644 index 0000000000000..32f94985859cf --- /dev/null +++ b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/commands/PaimonShowTablePartitionCommand.scala @@ -0,0 +1,96 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.spark.commands + +import org.apache.paimon.spark.leafnode.PaimonLeafRunnableCommand + +import org.apache.spark.sql.{Row, SparkSession} +import org.apache.spark.sql.catalyst.analysis.ResolvedPartitionSpec +import org.apache.spark.sql.catalyst.catalog.ExternalCatalogUtils.escapePathName +import org.apache.spark.sql.catalyst.expressions.{Attribute, ToPrettyString} +import org.apache.spark.sql.catalyst.expressions.Literal +import org.apache.spark.sql.connector.catalog.{Identifier, SupportsPartitionManagement, TableCatalog} +import org.apache.spark.sql.connector.catalog.PaimonCatalogImplicits._ +import org.apache.spark.sql.execution.datasources.v2.DataSourceV2Implicits._ + +import scala.collection.JavaConverters._ +import scala.collection.mutable + +case class PaimonShowTablePartitionCommand( + override val output: Seq[Attribute], + catalog: TableCatalog, + tableIndent: Identifier, + partSpec: ResolvedPartitionSpec) + extends PaimonLeafRunnableCommand { + override def run(sparkSession: SparkSession): Seq[Row] = { + val rows = new mutable.ArrayBuffer[Row]() + val table = catalog.loadTable(tableIndent) + val information = getTablePartitionDetails(tableIndent, table.asPartitionable, partSpec) + rows += Row(tableIndent.namespace.quoted, tableIndent.name(), false, s"$information\n") + + rows.toSeq + } + + private def getTablePartitionDetails( + tableIdent: Identifier, + partitionTable: SupportsPartitionManagement, + partSpec: ResolvedPartitionSpec): String = { + val results = new mutable.LinkedHashMap[String, String]() + + // "Partition Values" + val partitionSchema = partitionTable.partitionSchema() + val (names, ident) = (partSpec.names, partSpec.ident) + val partitionIdentifiers = partitionTable.listPartitionIdentifiers(names.toArray, ident) + if (partitionIdentifiers.isEmpty) { + val part = ident + .toSeq(partitionSchema) + .zip(partitionSchema.map(_.name)) + .map(kv => s"${kv._2}" + s" = ${kv._1}") + .mkString(", ") + throw new RuntimeException( + s""" + |[PARTITIONS_NOT_FOUND] The partition(s) PARTITION ($part) cannot be found in table ${tableIdent.toString}. + |Verify the partition specification and table name. 
+ |""".stripMargin) + } + assert(partitionIdentifiers.length == 1) + val row = partitionIdentifiers.head + val len = partitionSchema.length + val partitions = new Array[String](len) + val timeZoneId = conf.sessionLocalTimeZone + for (i <- 0 until len) { + val dataType = partitionSchema(i).dataType + val partValueUTF8String = + ToPrettyString(Literal(row.get(i, dataType), dataType), Some(timeZoneId)).eval(null) + val partValueStr = if (partValueUTF8String == null) "null" else partValueUTF8String.toString + partitions(i) = escapePathName(partitionSchema(i).name) + "=" + escapePathName(partValueStr) + } + val partitionValues = partitions.mkString("[", ", ", "]") + results.put("Partition Values", s"$partitionValues") + + // TODO "Partition Parameters", "Created Time", "Last Access", "Partition Statistics" + + results + .map { + case (key, value) => + if (value.isEmpty) key else s"$key: $value" + } + .mkString("", "\n", "") + } +} diff --git a/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/commands/PaimonShowTablesExtendedCommand.scala b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/commands/PaimonShowTablesExtendedCommand.scala new file mode 100644 index 0000000000000..b393982e25d3e --- /dev/null +++ b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/paimon/spark/commands/PaimonShowTablesExtendedCommand.scala @@ -0,0 +1,123 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.spark.commands + +import org.apache.paimon.spark.leafnode.PaimonLeafRunnableCommand + +import org.apache.spark.sql.{Row, SparkSession} +import org.apache.spark.sql.catalyst.catalog.CatalogTableType +import org.apache.spark.sql.catalyst.catalog.CatalogTypes.TablePartitionSpec +import org.apache.spark.sql.catalyst.expressions.Attribute +import org.apache.spark.sql.catalyst.util.{QuotingUtils, StringUtils} +import org.apache.spark.sql.connector.catalog.{Identifier, PaimonCatalogUtils, SupportsPartitionManagement, Table, TableCatalog} +import org.apache.spark.sql.connector.catalog.PaimonCatalogImplicits._ +import org.apache.spark.sql.execution.datasources.v2.DataSourceV2Implicits._ + +import scala.collection.JavaConverters._ +import scala.collection.mutable + +case class PaimonShowTablesExtendedCommand( + catalog: TableCatalog, + namespace: Seq[String], + pattern: String, + override val output: Seq[Attribute], + isExtended: Boolean = false, + partitionSpec: Option[TablePartitionSpec] = None) + extends PaimonLeafRunnableCommand { + + override def run(spark: SparkSession): Seq[Row] = { + val rows = new mutable.ArrayBuffer[Row]() + + val tables = catalog.listTables(namespace.toArray) + tables.map { + tableIdent: Identifier => + if (StringUtils.filterPattern(Seq(tableIdent.name()), pattern).nonEmpty) { + val table = catalog.loadTable(tableIdent) + val information = getTableDetails(catalog.name, tableIdent, table) + rows += Row(tableIdent.namespace().quoted, tableIdent.name(), false, s"$information\n") + } + } + + // TODO: view + + rows.toSeq + } + + private def getTableDetails(catalogName: String, identifier: Identifier, table: Table): String = { + val results = new mutable.LinkedHashMap[String, String]() + + results.put("Catalog", catalogName) + results.put("Namespace", identifier.namespace().quoted) + results.put("Table", identifier.name()) + val tableType = if (table.properties().containsKey(TableCatalog.PROP_EXTERNAL)) { + CatalogTableType.EXTERNAL + } else { + CatalogTableType.MANAGED + } + results.put("Type", tableType.name) + + PaimonCatalogUtils.TABLE_RESERVED_PROPERTIES + .filterNot(_ == TableCatalog.PROP_EXTERNAL) + .foreach( + propKey => { + if (table.properties.containsKey(propKey)) { + results.put(propKey.capitalize, table.properties.get(propKey)) + } + }) + + val properties: Seq[String] = + conf + .redactOptions(table.properties.asScala.toMap) + .toList + .filter(kv => !PaimonCatalogUtils.TABLE_RESERVED_PROPERTIES.contains(kv._1)) + .sortBy(_._1) + .map { case (key, value) => key + "=" + value } + if (!table.properties().isEmpty) { + results.put("Table Properties", properties.mkString("[", ", ", "]")) + } + + // Partition Provider & Partition Columns + if (supportsPartitions(table) && table.asPartitionable.partitionSchema().nonEmpty) { + results.put("Partition Provider", "Catalog") + results.put( + "Partition Columns", + table.asPartitionable + .partitionSchema() + .map(field => QuotingUtils.quoteIdentifier(field.name)) + .mkString("[", ", ", "]")) + } + + if (table.schema().nonEmpty) { + results.put("Schema", table.schema().treeString) + } + + results + .map { + case (key, value) => + if (value.isEmpty) key else s"$key: $value" + } + .mkString("", "\n", "") + } + + private def supportsPartitions(table: Table): Boolean = table match { + case _: SupportsPartitionManagement => true + case _ => false + } + +} diff --git a/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark3Shim.scala 
b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark3Shim.scala index 57d79d6474e9a..f508e2605cbc1 100644 --- a/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark3Shim.scala +++ b/paimon-spark/paimon-spark3-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark3Shim.scala @@ -18,6 +18,7 @@ package org.apache.spark.sql.paimon.shims +import org.apache.paimon.spark.catalyst.analysis.Spark3ResolutionRules import org.apache.paimon.spark.catalyst.parser.extensions.PaimonSpark3SqlExtensionsParser import org.apache.paimon.spark.data.{Spark3ArrayData, Spark3InternalRow, SparkArrayData, SparkInternalRow} import org.apache.paimon.types.{DataType, RowType} @@ -25,7 +26,8 @@ import org.apache.paimon.types.{DataType, RowType} import org.apache.spark.sql.{Column, SparkSession} import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression} import org.apache.spark.sql.catalyst.parser.ParserInterface -import org.apache.spark.sql.catalyst.plans.logical.Aggregate +import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, LogicalPlan} +import org.apache.spark.sql.catalyst.rules.Rule import org.apache.spark.sql.connector.catalog.{Identifier, Table, TableCatalog} import org.apache.spark.sql.connector.expressions.Transform import org.apache.spark.sql.types.StructType @@ -38,6 +40,10 @@ class Spark3Shim extends SparkShim { new PaimonSpark3SqlExtensionsParser(delegate) } + override def createCustomResolution(spark: SparkSession): Rule[LogicalPlan] = { + Spark3ResolutionRules(spark) + } + override def createSparkInternalRow(rowType: RowType): SparkInternalRow = { new Spark3InternalRow(rowType) } diff --git a/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/Spark4ResolutionRules.scala b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/Spark4ResolutionRules.scala new file mode 100644 index 0000000000000..461cbd0c938ac --- /dev/null +++ b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/paimon/spark/catalyst/analysis/Spark4ResolutionRules.scala @@ -0,0 +1,27 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package org.apache.paimon.spark.catalyst.analysis + +import org.apache.spark.sql.SparkSession +import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan +import org.apache.spark.sql.catalyst.rules.Rule + +case class Spark4ResolutionRules(session: SparkSession) extends Rule[LogicalPlan] { + override def apply(plan: LogicalPlan): LogicalPlan = plan +} diff --git a/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark4Shim.scala b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark4Shim.scala index dfec4eb71f4f1..eefddafdbfb89 100644 --- a/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark4Shim.scala +++ b/paimon-spark/paimon-spark4-common/src/main/scala/org/apache/spark/sql/paimon/shims/Spark4Shim.scala @@ -18,6 +18,7 @@ package org.apache.spark.sql.paimon.shims +import org.apache.paimon.spark.catalyst.analysis.Spark4ResolutionRules import org.apache.paimon.spark.catalyst.parser.extensions.PaimonSpark4SqlExtensionsParser import org.apache.paimon.spark.data.{Spark4ArrayData, Spark4InternalRow, SparkArrayData, SparkInternalRow} import org.apache.paimon.types.{DataType, RowType} @@ -25,7 +26,8 @@ import org.apache.paimon.types.{DataType, RowType} import org.apache.spark.sql.{Column, SparkSession} import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression} import org.apache.spark.sql.catalyst.parser.ParserInterface -import org.apache.spark.sql.catalyst.plans.logical.Aggregate +import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, LogicalPlan} +import org.apache.spark.sql.catalyst.rules.Rule import org.apache.spark.sql.connector.catalog.{CatalogV2Util, Identifier, Table, TableCatalog} import org.apache.spark.sql.connector.expressions.Transform import org.apache.spark.sql.internal.ExpressionUtils @@ -38,6 +40,11 @@ class Spark4Shim extends SparkShim { override def createSparkParser(delegate: ParserInterface): ParserInterface = { new PaimonSpark4SqlExtensionsParser(delegate) } + + override def createCustomResolution(spark: SparkSession): Rule[LogicalPlan] = { + Spark4ResolutionRules(spark) + } + override def createSparkInternalRow(rowType: RowType): SparkInternalRow = { new Spark4InternalRow(rowType) } From d33b8711fc6b4e1f35ba7d85336be4ff3baa956d Mon Sep 17 00:00:00 2001 From: "aiden.dong" <782112163@qq.com> Date: Tue, 3 Dec 2024 13:33:44 +0800 Subject: [PATCH 098/157] [core] Optimization of Parquet Predicate Pushdown Capability (#4608) --- .../table/PrimaryKeyFileStoreTableTest.java | 63 ++++++ .../format/parquet/ParquetReaderFactory.java | 66 +++++- .../parquet/reader/AbstractColumnReader.java | 204 +++++++++++++----- .../parquet/reader/BooleanColumnReader.java | 36 +++- .../parquet/reader/ByteColumnReader.java | 39 +++- .../parquet/reader/BytesColumnReader.java | 41 +++- .../parquet/reader/DoubleColumnReader.java | 38 +++- .../reader/FixedLenBytesColumnReader.java | 36 +++- .../parquet/reader/FloatColumnReader.java | 38 +++- .../parquet/reader/IntColumnReader.java | 39 +++- .../parquet/reader/LongColumnReader.java | 39 +++- .../parquet/reader/NestedColumnReader.java | 2 +- .../reader/NestedPrimitiveColumnReader.java | 141 +++++++----- .../parquet/reader/ParquetReadState.java | 148 +++++++++++++ .../reader/ParquetSplitReaderUtil.java | 41 ++-- .../parquet/reader/RunLengthDecoder.java | 45 ++++ .../parquet/reader/ShortColumnReader.java | 38 +++- .../parquet/reader/TimestampColumnReader.java | 15 +- 18 files changed, 898 insertions(+), 171 deletions(-) 
create mode 100644 paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetReadState.java diff --git a/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java b/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java index 46b85223bc2fa..e80b49a0f05df 100644 --- a/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/table/PrimaryKeyFileStoreTableTest.java @@ -84,6 +84,7 @@ import java.util.Iterator; import java.util.List; import java.util.Map; +import java.util.Random; import java.util.concurrent.ThreadLocalRandom; import java.util.concurrent.atomic.AtomicInteger; import java.util.function.BiFunction; @@ -809,6 +810,68 @@ public void testDeletionVectorsWithFileIndexInFile() throws Exception { "1|4|500|binary|varbinary|mapKey:mapVal|multiset")); } + @Test + public void testDeletionVectorsWithParquetFilter() throws Exception { + FileStoreTable table = + createFileStoreTable( + conf -> { + conf.set(BUCKET, 1); + conf.set(DELETION_VECTORS_ENABLED, true); + conf.set(FILE_FORMAT, "parquet"); + conf.set("parquet.block.size", "1048576"); + conf.set("parquet.page.size", "1024"); + }); + + BatchWriteBuilder writeBuilder = table.newBatchWriteBuilder(); + + BatchTableWrite write = + (BatchTableWrite) + writeBuilder + .newWrite() + .withIOManager(new IOManagerImpl(tempDir.toString())); + + for (int i = 0; i < 200000; i++) { + write.write(rowData(1, i, i * 100L)); + } + + List messages = write.prepareCommit(); + BatchTableCommit commit = writeBuilder.newCommit(); + commit.commit(messages); + write = + (BatchTableWrite) + writeBuilder + .newWrite() + .withIOManager(new IOManagerImpl(tempDir.toString())); + for (int i = 180000; i < 200000; i++) { + write.write(rowDataWithKind(RowKind.DELETE, 1, i, i * 100L)); + } + + messages = write.prepareCommit(); + commit = writeBuilder.newCommit(); + commit.commit(messages); + + PredicateBuilder builder = new PredicateBuilder(ROW_TYPE); + List splits = toSplits(table.newSnapshotReader().read().dataSplits()); + Random random = new Random(); + + for (int i = 0; i < 10; i++) { + int value = random.nextInt(180000); + TableRead read = table.newRead().withFilter(builder.equal(1, value)).executeFilter(); + assertThat(getResult(read, splits, BATCH_ROW_TO_STRING)) + .isEqualTo( + Arrays.asList( + String.format( + "%d|%d|%d|binary|varbinary|mapKey:mapVal|multiset", + 1, value, value * 100L))); + } + + for (int i = 0; i < 10; i++) { + int value = 180000 + random.nextInt(20000); + TableRead read = table.newRead().withFilter(builder.equal(1, value)).executeFilter(); + assertThat(getResult(read, splits, BATCH_ROW_TO_STRING)).isEmpty(); + } + } + @Test public void testDeletionVectorsWithFileIndexInMeta() throws Exception { FileStoreTable table = diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java index f0151d6f3d8fb..0c996531201a5 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/ParquetReaderFactory.java @@ -28,6 +28,7 @@ import org.apache.paimon.format.FormatReaderFactory; import org.apache.paimon.format.parquet.reader.ColumnReader; import org.apache.paimon.format.parquet.reader.ParquetDecimalVector; +import org.apache.paimon.format.parquet.reader.ParquetReadState; import 
org.apache.paimon.format.parquet.reader.ParquetTimestampVector; import org.apache.paimon.format.parquet.type.ParquetField; import org.apache.paimon.fs.Path; @@ -130,7 +131,7 @@ public FileRecordReader createReader(FormatReaderFactory.Context co buildFieldsList(projectedType.getFields(), projectedType.getFieldNames(), columnIO); return new ParquetReader( - reader, requestedSchema, reader.getRecordCount(), poolOfBatches, fields); + reader, requestedSchema, reader.getFilteredRecordCount(), poolOfBatches, fields); } private void setReadOptions(ParquetReadOptions.Builder builder) { @@ -336,6 +337,10 @@ private class ParquetReader implements FileRecordReader { private long nextRowPosition; + private ParquetReadState currentRowGroupReadState; + + private long currentRowGroupFirstRowIndex; + /** * For each request column, the reader to read this column. This is NULL if this column is * missing from the file, in which case we populate the attribute with NULL. @@ -359,6 +364,7 @@ private ParquetReader( this.totalCountLoadedSoFar = 0; this.currentRowPosition = 0; this.nextRowPosition = 0; + this.currentRowGroupFirstRowIndex = 0; this.fields = fields; } @@ -390,7 +396,8 @@ private boolean nextBatch(ParquetReaderBatch batch) throws IOException { currentRowPosition = nextRowPosition; } - int num = (int) Math.min(batchSize, totalCountLoadedSoFar - rowsReturned); + int num = getBachSize(); + for (int i = 0; i < columnReaders.length; ++i) { if (columnReaders[i] == null) { batch.writableVectors[i].fillWithNulls(); @@ -400,13 +407,13 @@ private boolean nextBatch(ParquetReaderBatch batch) throws IOException { } } rowsReturned += num; - nextRowPosition = currentRowPosition + num; + nextRowPosition = getNextRowPosition(num); batch.columnarBatch.setNumRows(num); return true; } private void readNextRowGroup() throws IOException { - PageReadStore rowGroup = reader.readNextRowGroup(); + PageReadStore rowGroup = reader.readNextFilteredRowGroup(); if (rowGroup == null) { throw new IOException( "expecting more rows but reached last block. Read " @@ -415,6 +422,9 @@ private void readNextRowGroup() throws IOException { + totalRowCount); } + this.currentRowGroupReadState = + new ParquetReadState(rowGroup.getRowIndexes().orElse(null)); + List types = requestedSchema.getFields(); columnReaders = new ColumnReader[types.size()]; for (int i = 0; i < types.size(); ++i) { @@ -429,18 +439,62 @@ private void readNextRowGroup() throws IOException { 0); } } + totalCountLoadedSoFar += rowGroup.getRowCount(); - if (rowGroup.getRowIndexOffset().isPresent()) { - currentRowPosition = rowGroup.getRowIndexOffset().get(); + + if (rowGroup.getRowIndexOffset().isPresent()) { // filter + currentRowGroupFirstRowIndex = rowGroup.getRowIndexOffset().get(); + long pageIndex = 0; + if (!this.currentRowGroupReadState.isMaxRange()) { + pageIndex = this.currentRowGroupReadState.currentRangeStart(); + } + currentRowPosition = currentRowGroupFirstRowIndex + pageIndex; } else { if (reader.rowGroupsFiltered()) { throw new RuntimeException( "There is a bug, rowIndexOffset must be present when row groups are filtered."); } + currentRowGroupFirstRowIndex = nextRowPosition; currentRowPosition = nextRowPosition; } } + private int getBachSize() throws IOException { + + long rangeBatchSize = Long.MAX_VALUE; + if (this.currentRowGroupReadState.isFinished()) { + throw new IOException( + "expecting more rows but reached last page block. 
Read " + + rowsReturned + + " out of " + + totalRowCount); + } else if (!this.currentRowGroupReadState.isMaxRange()) { + long pageIndex = this.currentRowPosition - this.currentRowGroupFirstRowIndex; + rangeBatchSize = this.currentRowGroupReadState.currentRangeEnd() - pageIndex + 1; + } + + return (int) + Math.min( + batchSize, + Math.min(rangeBatchSize, totalCountLoadedSoFar - rowsReturned)); + } + + private long getNextRowPosition(int num) { + if (this.currentRowGroupReadState.isMaxRange()) { + return this.currentRowPosition + num; + } else { + long pageIndex = this.currentRowPosition - this.currentRowGroupFirstRowIndex; + long nextIndex = pageIndex + num; + + if (this.currentRowGroupReadState.currentRangeEnd() < nextIndex) { + this.currentRowGroupReadState.nextRange(); + nextIndex = this.currentRowGroupReadState.currentRangeStart(); + } + + return nextIndex; + } + } + private ParquetReaderBatch getCachedEntry() throws IOException { try { return pool.pollEntry(); diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/AbstractColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/AbstractColumnReader.java index 7e2ab6d5e7f05..5e3f4a7e6a336 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/AbstractColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/AbstractColumnReader.java @@ -32,6 +32,7 @@ import org.apache.parquet.column.page.DataPageV1; import org.apache.parquet.column.page.DataPageV2; import org.apache.parquet.column.page.DictionaryPage; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.column.page.PageReader; import org.apache.parquet.column.values.ValuesReader; import org.apache.parquet.io.ParquetDecodingException; @@ -65,20 +66,16 @@ public abstract class AbstractColumnReader protected final ColumnDescriptor descriptor; - /** Total number of values read. */ - private long valuesRead; - - /** - * value that indicates the end of the current page. That is, if valuesRead == - * endOfPageValueCount, we are at the end of the page. - */ - private long endOfPageValueCount; - /** If true, the current page is dictionary encoded. */ private boolean isCurrentPageDictionaryEncoded; /** Total values in the current page. */ - private int pageValueCount; + // private int pageValueCount; + + /** + * Helper struct to track intermediate states while reading Parquet pages in the column chunk. + */ + private final ParquetReadState readState; /* * Input streams: @@ -101,12 +98,14 @@ public abstract class AbstractColumnReader /** Dictionary decoder to wrap dictionary ids input stream. 
*/ private RunLengthDecoder dictionaryIdsDecoder; - public AbstractColumnReader(ColumnDescriptor descriptor, PageReader pageReader) + public AbstractColumnReader(ColumnDescriptor descriptor, PageReadStore pageReadStore) throws IOException { this.descriptor = descriptor; - this.pageReader = pageReader; + this.pageReader = pageReadStore.getPageReader(descriptor); this.maxDefLevel = descriptor.getMaxDefinitionLevel(); + this.readState = new ParquetReadState(pageReadStore.getRowIndexes().orElse(null)); + DictionaryPage dictionaryPage = pageReader.readDictionaryPage(); if (dictionaryPage != null) { try { @@ -147,56 +146,136 @@ public final void readToVector(int readNumber, VECTOR vector) throws IOException if (dictionary != null) { dictionaryIds = vector.reserveDictionaryIds(readNumber); } - while (readNumber > 0) { + + readState.resetForNewBatch(readNumber); + + while (readState.rowsToReadInBatch > 0) { // Compute the number of values we want to read in this page. - int leftInPage = (int) (endOfPageValueCount - valuesRead); - if (leftInPage == 0) { - DataPage page = pageReader.readPage(); - if (page instanceof DataPageV1) { - readPageV1((DataPageV1) page); - } else if (page instanceof DataPageV2) { - readPageV2((DataPageV2) page); - } else { - throw new RuntimeException("Unsupported page type: " + page.getClass()); + if (readState.valuesToReadInPage == 0) { + int pageValueCount = readPage(); + if (pageValueCount < 0) { + // we've read all the pages; this could happen when we're reading a repeated + // list and we + // don't know where the list will end until we've seen all the pages. + break; } - leftInPage = (int) (endOfPageValueCount - valuesRead); } - int num = Math.min(readNumber, leftInPage); - if (isCurrentPageDictionaryEncoded) { - // Read and decode dictionary ids. - runLenDecoder.readDictionaryIds( - num, dictionaryIds, vector, rowId, maxDefLevel, this.dictionaryIdsDecoder); - - if (vector.hasDictionary() || (rowId == 0 && supportLazyDecode())) { - // Column vector supports lazy decoding of dictionary values so just set the - // dictionary. - // We can't do this if rowId != 0 AND the column doesn't have a dictionary (i.e. - // some - // non-dictionary encoded values have already been added). - vector.setDictionary(new ParquetDictionary(dictionary)); + + if (readState.isFinished()) { + break; + } + + long pageRowId = readState.rowId; + int leftInBatch = readState.rowsToReadInBatch; + int leftInPage = readState.valuesToReadInPage; + + int readBatch = Math.min(leftInBatch, leftInPage); + + long rangeStart = readState.currentRangeStart(); + long rangeEnd = readState.currentRangeEnd(); + + if (pageRowId < rangeStart) { + int toSkip = (int) (rangeStart - pageRowId); + if (toSkip >= leftInPage) { // drop page + pageRowId += leftInPage; + leftInPage = 0; } else { - readBatchFromDictionaryIds(rowId, num, vector, dictionaryIds); + if (isCurrentPageDictionaryEncoded) { + runLenDecoder.skipDictionaryIds( + toSkip, maxDefLevel, this.dictionaryIdsDecoder); + pageRowId += toSkip; + leftInPage -= toSkip; + } else { + skipBatch(toSkip); + pageRowId += toSkip; + leftInPage -= toSkip; + } } + } else if (pageRowId > rangeEnd) { + readState.nextRange(); } else { - if (vector.hasDictionary() && rowId != 0) { - // This batch already has dictionary encoded values but this new page is not. - // The batch - // does not support a mix of dictionary and not so we will decode the - // dictionary. 
- readBatchFromDictionaryIds(0, rowId, vector, vector.getDictionaryIds()); + long start = pageRowId; + long end = Math.min(rangeEnd, pageRowId + readBatch - 1); + int num = (int) (end - start + 1); + + if (isCurrentPageDictionaryEncoded) { + // Read and decode dictionary ids. + runLenDecoder.readDictionaryIds( + num, + dictionaryIds, + vector, + rowId, + maxDefLevel, + this.dictionaryIdsDecoder); + + if (vector.hasDictionary() || (rowId == 0 && supportLazyDecode())) { + // Column vector supports lazy decoding of dictionary values so just set the + // dictionary. + // We can't do this if rowId != 0 AND the column doesn't have a dictionary + // (i.e. + // some + // non-dictionary encoded values have already been added). + vector.setDictionary(new ParquetDictionary(dictionary)); + } else { + readBatchFromDictionaryIds(rowId, num, vector, dictionaryIds); + } + } else { + if (vector.hasDictionary() && rowId != 0) { + // This batch already has dictionary encoded values but this new page is + // not. + // The batch + // does not support a mix of dictionary and not so we will decode the + // dictionary. + readBatchFromDictionaryIds(0, rowId, vector, vector.getDictionaryIds()); + } + vector.setDictionary(null); + readBatch(rowId, num, vector); } - vector.setDictionary(null); - readBatch(rowId, num, vector); + leftInBatch -= num; + pageRowId += num; + leftInPage -= num; + rowId += num; } + readState.rowsToReadInBatch = leftInBatch; + readState.valuesToReadInPage = leftInPage; + readState.rowId = pageRowId; + } + } - valuesRead += num; - rowId += num; - readNumber -= num; + private int readPage() { + DataPage page = pageReader.readPage(); + if (page == null) { + return -1; } + long pageFirstRowIndex = page.getFirstRowIndex().orElse(0L); + + int pageValueCount = + page.accept( + new DataPage.Visitor() { + @Override + public Integer visit(DataPageV1 dataPageV1) { + try { + return readPageV1(dataPageV1); + } catch (IOException e) { + throw new RuntimeException(e); + } + } + + @Override + public Integer visit(DataPageV2 dataPageV2) { + try { + return readPageV2(dataPageV2); + } catch (IOException e) { + throw new RuntimeException(e); + } + } + }); + readState.resetForNewPage(pageValueCount, pageFirstRowIndex); + return pageValueCount; } - private void readPageV1(DataPageV1 page) throws IOException { - this.pageValueCount = page.getValueCount(); + private int readPageV1(DataPageV1 page) throws IOException { + int pageValueCount = page.getValueCount(); ValuesReader rlReader = page.getRlEncoding().getValuesReader(descriptor, REPETITION_LEVEL); // Initialize the decoders. @@ -211,30 +290,31 @@ private void readPageV1(DataPageV1 page) throws IOException { ByteBufferInputStream in = bytes.toInputStream(); rlReader.initFromPage(pageValueCount, in); this.runLenDecoder.initFromStream(pageValueCount, in); - prepareNewPage(page.getValueEncoding(), in); + prepareNewPage(page.getValueEncoding(), in, pageValueCount); + return pageValueCount; } catch (IOException e) { throw new IOException("could not read page " + page + " in col " + descriptor, e); } } - private void readPageV2(DataPageV2 page) throws IOException { - this.pageValueCount = page.getValueCount(); + private int readPageV2(DataPageV2 page) throws IOException { + int pageValueCount = page.getValueCount(); int bitWidth = BytesUtils.getWidthFromMaxInt(descriptor.getMaxDefinitionLevel()); // do not read the length from the stream. v2 pages handle dividing the page bytes. 
this.runLenDecoder = new RunLengthDecoder(bitWidth, false); this.runLenDecoder.initFromStream( - this.pageValueCount, page.getDefinitionLevels().toInputStream()); + pageValueCount, page.getDefinitionLevels().toInputStream()); try { - prepareNewPage(page.getDataEncoding(), page.getData().toInputStream()); + prepareNewPage(page.getDataEncoding(), page.getData().toInputStream(), pageValueCount); + return pageValueCount; } catch (IOException e) { throw new IOException("could not read page " + page + " in col " + descriptor, e); } } - private void prepareNewPage(Encoding dataEncoding, ByteBufferInputStream in) + private void prepareNewPage(Encoding dataEncoding, ByteBufferInputStream in, int pageValueCount) throws IOException { - this.endOfPageValueCount = valuesRead + pageValueCount; if (dataEncoding.usesDictionary()) { if (dictionary == null) { throw new IOException( @@ -269,6 +349,14 @@ private void prepareNewPage(Encoding dataEncoding, ByteBufferInputStream in) afterReadPage(); } + final void skipDataBuffer(int length) { + try { + dataInputStream.skipFully(length); + } catch (IOException e) { + throw new ParquetDecodingException("Failed to skip " + length + " bytes", e); + } + } + final ByteBuffer readDataBuffer(int length) { try { return dataInputStream.slice(length).order(ByteOrder.LITTLE_ENDIAN); @@ -291,6 +379,8 @@ protected boolean supportLazyDecode() { /** Read batch from {@link #runLenDecoder} and {@link #dataInputStream}. */ protected abstract void readBatch(int rowId, int num, VECTOR column); + protected abstract void skipBatch(int num); + /** * Decode dictionary ids to data. From {@link #runLenDecoder} and {@link #dictionaryIdsDecoder}. */ diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/BooleanColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/BooleanColumnReader.java index d5dc231d8436d..83d3c5a07d4b6 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/BooleanColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/BooleanColumnReader.java @@ -22,7 +22,7 @@ import org.apache.paimon.data.columnar.writable.WritableIntVector; import org.apache.parquet.column.ColumnDescriptor; -import org.apache.parquet.column.page.PageReader; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.io.ParquetDecodingException; import org.apache.parquet.schema.PrimitiveType; @@ -36,9 +36,9 @@ public class BooleanColumnReader extends AbstractColumnReader 0) { + if (runLenDecoder.currentCount == 0) { + runLenDecoder.readNextGroup(); + } + int n = Math.min(left, runLenDecoder.currentCount); + switch (runLenDecoder.mode) { + case RLE: + if (runLenDecoder.currentValue == maxDefLevel) { + for (int i = 0; i < n; i++) { + readBoolean(); + } + } + break; + case PACKED: + for (int i = 0; i < n; ++i) { + if (runLenDecoder.currentBuffer[runLenDecoder.currentBufferIdx++] + == maxDefLevel) { + readBoolean(); + } + } + break; + } + left -= n; + runLenDecoder.currentCount -= n; + } + } + private boolean readBoolean() { if (bitOffset == 0) { try { diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ByteColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ByteColumnReader.java index bed9923d9be35..804b8bc0275ea 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ByteColumnReader.java +++ 
b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ByteColumnReader.java @@ -22,7 +22,7 @@ import org.apache.paimon.data.columnar.writable.WritableIntVector; import org.apache.parquet.column.ColumnDescriptor; -import org.apache.parquet.column.page.PageReader; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.schema.PrimitiveType; import java.io.IOException; @@ -31,8 +31,9 @@ /** Byte {@link ColumnReader}. Using INT32 to store byte, so just cast int to byte. */ public class ByteColumnReader extends AbstractColumnReader { - public ByteColumnReader(ColumnDescriptor descriptor, PageReader pageReader) throws IOException { - super(descriptor, pageReader); + public ByteColumnReader(ColumnDescriptor descriptor, PageReadStore pageReadStore) + throws IOException { + super(descriptor, pageReadStore); checkTypeName(PrimitiveType.PrimitiveTypeName.INT32); } @@ -69,6 +70,38 @@ protected void readBatch(int rowId, int num, WritableByteVector column) { } } + @Override + protected void skipBatch(int num) { + int left = num; + while (left > 0) { + if (runLenDecoder.currentCount == 0) { + runLenDecoder.readNextGroup(); + } + int n = Math.min(left, runLenDecoder.currentCount); + switch (runLenDecoder.mode) { + case RLE: + if (runLenDecoder.currentValue == maxDefLevel) { + skipByte(n); + } + break; + case PACKED: + for (int i = 0; i < n; ++i) { + if (runLenDecoder.currentBuffer[runLenDecoder.currentBufferIdx++] + == maxDefLevel) { + skipByte(1); + } + } + break; + } + left -= n; + runLenDecoder.currentCount -= n; + } + } + + private void skipByte(int num) { + skipDataBuffer(4 * num); + } + @Override protected void readBatchFromDictionaryIds( int rowId, int num, WritableByteVector column, WritableIntVector dictionaryIds) { diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/BytesColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/BytesColumnReader.java index e83115c8a69f4..6ee395e585684 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/BytesColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/BytesColumnReader.java @@ -22,7 +22,7 @@ import org.apache.paimon.data.columnar.writable.WritableIntVector; import org.apache.parquet.column.ColumnDescriptor; -import org.apache.parquet.column.page.PageReader; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.schema.PrimitiveType; import java.io.IOException; @@ -31,9 +31,9 @@ /** Bytes {@link ColumnReader}. A int length and bytes data. 
*/ public class BytesColumnReader extends AbstractColumnReader { - public BytesColumnReader(ColumnDescriptor descriptor, PageReader pageReader) + public BytesColumnReader(ColumnDescriptor descriptor, PageReadStore pageReadStore) throws IOException { - super(descriptor, pageReader); + super(descriptor, pageReadStore); checkTypeName(PrimitiveType.PrimitiveTypeName.BINARY); } @@ -70,6 +70,41 @@ protected void readBatch(int rowId, int num, WritableBytesVector column) { } } + @Override + protected void skipBatch(int num) { + int left = num; + while (left > 0) { + if (runLenDecoder.currentCount == 0) { + runLenDecoder.readNextGroup(); + } + int n = Math.min(left, runLenDecoder.currentCount); + switch (runLenDecoder.mode) { + case RLE: + if (runLenDecoder.currentValue == maxDefLevel) { + skipBinary(n); + } + break; + case PACKED: + for (int i = 0; i < n; ++i) { + if (runLenDecoder.currentBuffer[runLenDecoder.currentBufferIdx++] + == maxDefLevel) { + skipBinary(1); + } + } + break; + } + left -= n; + runLenDecoder.currentCount -= n; + } + } + + private void skipBinary(int num) { + for (int i = 0; i < num; i++) { + int len = readDataBuffer(4).getInt(); + skipDataBuffer(len); + } + } + @Override protected void readBatchFromDictionaryIds( int rowId, int num, WritableBytesVector column, WritableIntVector dictionaryIds) { diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/DoubleColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/DoubleColumnReader.java index d6d8aa2bbb22b..2cffd406248e5 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/DoubleColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/DoubleColumnReader.java @@ -22,7 +22,7 @@ import org.apache.paimon.data.columnar.writable.WritableIntVector; import org.apache.parquet.column.ColumnDescriptor; -import org.apache.parquet.column.page.PageReader; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.schema.PrimitiveType; import java.io.IOException; @@ -31,9 +31,9 @@ /** Double {@link ColumnReader}. 
*/ public class DoubleColumnReader extends AbstractColumnReader { - public DoubleColumnReader(ColumnDescriptor descriptor, PageReader pageReader) + public DoubleColumnReader(ColumnDescriptor descriptor, PageReadStore pageReadStore) throws IOException { - super(descriptor, pageReader); + super(descriptor, pageReadStore); checkTypeName(PrimitiveType.PrimitiveTypeName.DOUBLE); } @@ -70,6 +70,38 @@ protected void readBatch(int rowId, int num, WritableDoubleVector column) { } } + @Override + protected void skipBatch(int num) { + int left = num; + while (left > 0) { + if (runLenDecoder.currentCount == 0) { + runLenDecoder.readNextGroup(); + } + int n = Math.min(left, runLenDecoder.currentCount); + switch (runLenDecoder.mode) { + case RLE: + if (runLenDecoder.currentValue == maxDefLevel) { + skipDouble(n); + } + break; + case PACKED: + for (int i = 0; i < n; ++i) { + if (runLenDecoder.currentBuffer[runLenDecoder.currentBufferIdx++] + == maxDefLevel) { + skipDouble(1); + } + } + break; + } + left -= n; + runLenDecoder.currentCount -= n; + } + } + + private void skipDouble(int num) { + skipDataBuffer(8 * num); + } + @Override protected void readBatchFromDictionaryIds( int rowId, int num, WritableDoubleVector column, WritableIntVector dictionaryIds) { diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/FixedLenBytesColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/FixedLenBytesColumnReader.java index afce717a67197..25e1b466e4658 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/FixedLenBytesColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/FixedLenBytesColumnReader.java @@ -25,7 +25,7 @@ import org.apache.paimon.format.parquet.ParquetSchemaConverter; import org.apache.parquet.column.ColumnDescriptor; -import org.apache.parquet.column.page.PageReader; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.io.api.Binary; import org.apache.parquet.schema.PrimitiveType; @@ -39,8 +39,9 @@ public class FixedLenBytesColumnReader private final int precision; public FixedLenBytesColumnReader( - ColumnDescriptor descriptor, PageReader pageReader, int precision) throws IOException { - super(descriptor, pageReader); + ColumnDescriptor descriptor, PageReadStore pageReadStore, int precision) + throws IOException { + super(descriptor, pageReadStore); checkTypeName(PrimitiveType.PrimitiveTypeName.FIXED_LEN_BYTE_ARRAY); this.precision = precision; } @@ -79,6 +80,35 @@ protected void readBatch(int rowId, int num, VECTOR column) { } } + @Override + protected void skipBatch(int num) { + int bytesLen = descriptor.getPrimitiveType().getTypeLength(); + if (ParquetSchemaConverter.is32BitDecimal(precision)) { + for (int i = 0; i < num; i++) { + if (runLenDecoder.readInteger() == maxDefLevel) { + skipDataBinary(bytesLen); + } + } + } else if (ParquetSchemaConverter.is64BitDecimal(precision)) { + + for (int i = 0; i < num; i++) { + if (runLenDecoder.readInteger() == maxDefLevel) { + skipDataBinary(bytesLen); + } + } + } else { + for (int i = 0; i < num; i++) { + if (runLenDecoder.readInteger() == maxDefLevel) { + skipDataBinary(bytesLen); + } + } + } + } + + private void skipDataBinary(int len) { + skipDataBuffer(len); + } + @Override protected void readBatchFromDictionaryIds( int rowId, int num, VECTOR column, WritableIntVector dictionaryIds) { diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/FloatColumnReader.java 
b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/FloatColumnReader.java index 1f4adfa4b9c8c..e9eec13df5fc5 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/FloatColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/FloatColumnReader.java @@ -22,7 +22,7 @@ import org.apache.paimon.data.columnar.writable.WritableIntVector; import org.apache.parquet.column.ColumnDescriptor; -import org.apache.parquet.column.page.PageReader; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.schema.PrimitiveType; import java.io.IOException; @@ -31,9 +31,9 @@ /** Float {@link ColumnReader}. */ public class FloatColumnReader extends AbstractColumnReader { - public FloatColumnReader(ColumnDescriptor descriptor, PageReader pageReader) + public FloatColumnReader(ColumnDescriptor descriptor, PageReadStore pageReadStore) throws IOException { - super(descriptor, pageReader); + super(descriptor, pageReadStore); checkTypeName(PrimitiveType.PrimitiveTypeName.FLOAT); } @@ -70,6 +70,38 @@ protected void readBatch(int rowId, int num, WritableFloatVector column) { } } + @Override + protected void skipBatch(int num) { + int left = num; + while (left > 0) { + if (runLenDecoder.currentCount == 0) { + runLenDecoder.readNextGroup(); + } + int n = Math.min(left, runLenDecoder.currentCount); + switch (runLenDecoder.mode) { + case RLE: + if (runLenDecoder.currentValue == maxDefLevel) { + skipFloat(n); + } + break; + case PACKED: + for (int i = 0; i < n; ++i) { + if (runLenDecoder.currentBuffer[runLenDecoder.currentBufferIdx++] + == maxDefLevel) { + skipFloat(1); + } + } + break; + } + left -= n; + runLenDecoder.currentCount -= n; + } + } + + private void skipFloat(int num) { + skipDataBuffer(4 * num); + } + @Override protected void readBatchFromDictionaryIds( int rowId, int num, WritableFloatVector column, WritableIntVector dictionaryIds) { diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/IntColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/IntColumnReader.java index e38e916d187e6..521ad998f6f1f 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/IntColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/IntColumnReader.java @@ -21,7 +21,7 @@ import org.apache.paimon.data.columnar.writable.WritableIntVector; import org.apache.parquet.column.ColumnDescriptor; -import org.apache.parquet.column.page.PageReader; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.schema.PrimitiveType; import java.io.IOException; @@ -30,8 +30,9 @@ /** Int {@link ColumnReader}. 
*/ public class IntColumnReader extends AbstractColumnReader { - public IntColumnReader(ColumnDescriptor descriptor, PageReader pageReader) throws IOException { - super(descriptor, pageReader); + public IntColumnReader(ColumnDescriptor descriptor, PageReadStore pageReadStore) + throws IOException { + super(descriptor, pageReadStore); checkTypeName(PrimitiveType.PrimitiveTypeName.INT32); } @@ -68,6 +69,38 @@ protected void readBatch(int rowId, int num, WritableIntVector column) { } } + @Override + protected void skipBatch(int num) { + int left = num; + while (left > 0) { + if (runLenDecoder.currentCount == 0) { + runLenDecoder.readNextGroup(); + } + int n = Math.min(left, runLenDecoder.currentCount); + switch (runLenDecoder.mode) { + case RLE: + if (runLenDecoder.currentValue == maxDefLevel) { + skipInteger(n); + } + break; + case PACKED: + for (int i = 0; i < n; ++i) { + if (runLenDecoder.currentBuffer[runLenDecoder.currentBufferIdx++] + == maxDefLevel) { + skipInteger(1); + } + } + break; + } + left -= n; + runLenDecoder.currentCount -= n; + } + } + + private void skipInteger(int num) { + skipDataBuffer(4 * num); + } + @Override protected void readBatchFromDictionaryIds( int rowId, int num, WritableIntVector column, WritableIntVector dictionaryIds) { diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/LongColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/LongColumnReader.java index a8e04eae673af..c4af086a7026a 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/LongColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/LongColumnReader.java @@ -22,7 +22,7 @@ import org.apache.paimon.data.columnar.writable.WritableLongVector; import org.apache.parquet.column.ColumnDescriptor; -import org.apache.parquet.column.page.PageReader; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.schema.PrimitiveType; import java.io.IOException; @@ -31,8 +31,9 @@ /** Long {@link ColumnReader}. 
*/ public class LongColumnReader extends AbstractColumnReader { - public LongColumnReader(ColumnDescriptor descriptor, PageReader pageReader) throws IOException { - super(descriptor, pageReader); + public LongColumnReader(ColumnDescriptor descriptor, PageReadStore pageReadStore) + throws IOException { + super(descriptor, pageReadStore); checkTypeName(PrimitiveType.PrimitiveTypeName.INT64); } @@ -69,6 +70,38 @@ protected void readBatch(int rowId, int num, WritableLongVector column) { } } + @Override + protected void skipBatch(int num) { + int left = num; + while (left > 0) { + if (runLenDecoder.currentCount == 0) { + runLenDecoder.readNextGroup(); + } + int n = Math.min(left, runLenDecoder.currentCount); + switch (runLenDecoder.mode) { + case RLE: + if (runLenDecoder.currentValue == maxDefLevel) { + skipValue(n); + } + break; + case PACKED: + for (int i = 0; i < n; ++i) { + if (runLenDecoder.currentBuffer[runLenDecoder.currentBufferIdx++] + == maxDefLevel) { + skipValue(1); + } + } + break; + } + left -= n; + runLenDecoder.currentCount -= n; + } + } + + private void skipValue(int num) { + skipDataBuffer(num * 8); + } + @Override protected void readBatchFromDictionaryIds( int rowId, int num, WritableLongVector column, WritableIntVector dictionaryIds) { diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedColumnReader.java index 68225fbd13207..8f20be2754471 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedColumnReader.java @@ -279,7 +279,7 @@ private Pair readPrimitive( reader = new NestedPrimitiveColumnReader( descriptor, - pages.getPageReader(descriptor), + pages, isUtcTimestamp, descriptor.getPrimitiveType(), field.getType(), diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedPrimitiveColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedPrimitiveColumnReader.java index 7d00ff79234ae..7db7aedbf6aee 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedPrimitiveColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/NestedPrimitiveColumnReader.java @@ -44,6 +44,7 @@ import org.apache.parquet.column.page.DataPageV1; import org.apache.parquet.column.page.DataPageV2; import org.apache.parquet.column.page.DictionaryPage; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.column.page.PageReader; import org.apache.parquet.column.values.ValuesReader; import org.apache.parquet.column.values.rle.RunLengthBitPackingHybridDecoder; @@ -82,15 +83,6 @@ public class NestedPrimitiveColumnReader implements ColumnReader valueList = new ArrayList<>(); + int valueIndex = collectDataFromParquetPage(readNumber, valueList); + + return fillColumnVector(valueIndex, valueList); + } + + private int collectDataFromParquetPage(int total, List valueList) throws IOException { + int valueIndex = 0; // repeated type need two loops to read data. 
- while (!eof && index < readNumber) { + + readState.resetForNewBatch(total); + + while (!eof && readState.rowsToReadInBatch > 0) { + + if (readState.isFinished()) { // finished reading + eof = true; + break; + } + + long pageRowId = readState.rowId; + long rangeStart = readState.currentRangeStart(); + long rangeEnd = readState.currentRangeEnd(); + + if (pageRowId > rangeEnd) { + readState.nextRange(); + continue; + } + + boolean needFilterSkip = pageRowId < rangeStart; + do { - if (!lastValue.shouldSkip) { + + if (!lastValue.shouldSkip && !needFilterSkip) { valueList.add(lastValue.value); valueIndex++; } } while (readValue() && (repetitionLevel != 0)); - index++; + + if (pageRowId == readState.rowId) { + readState.rowId = readState.rowId + 1; + } + + if (!needFilterSkip) { + readState.rowsToReadInBatch = readState.rowsToReadInBatch - 1; + } } - return fillColumnVector(valueIndex, valueList); + return valueIndex; } public LevelDelegation getLevelDelegation() { @@ -255,20 +287,24 @@ private void readAndSaveRepetitionAndDefinitionLevels() { // get the values of repetition and definitionLevel repetitionLevel = repetitionLevelColumn.nextInt(); definitionLevel = definitionLevelColumn.nextInt(); - valuesRead++; + readState.valuesToReadInPage = readState.valuesToReadInPage - 1; repetitionLevelList.add(repetitionLevel); definitionLevelList.add(definitionLevel); } private int readPageIfNeed() throws IOException { // Compute the number of values we want to read in this page. - int leftInPage = (int) (endOfPageValueCount - valuesRead); - if (leftInPage == 0) { - // no data left in current page, load data from new page - readPage(); - leftInPage = (int) (endOfPageValueCount - valuesRead); + if (readState.valuesToReadInPage == 0) { + int pageValueCount = readPage(); + // returns the number of values in the current page + if (pageValueCount < 0) { + // we've read all the pages; this could happen when we're reading a repeated list + // and we don't know where the list will end until we've seen all the pages.
+ return -1; + } } - return leftInPage; + return readState.valuesToReadInPage; } private Object readPrimitiveTypedRow(DataType category) { @@ -528,33 +564,36 @@ private static HeapBytesVector getHeapBytesVector(int total, List valueList) { return phbv; } - protected void readPage() { + protected int readPage() { DataPage page = pageReader.readPage(); if (page == null) { - return; + return -1; } - page.accept( - new DataPage.Visitor() { - @Override - public Void visit(DataPageV1 dataPageV1) { - readPageV1(dataPageV1); - return null; - } + long pageFirstRowIndex = page.getFirstRowIndex().orElse(0L); - @Override - public Void visit(DataPageV2 dataPageV2) { - readPageV2(dataPageV2); - return null; - } - }); + int pageValueCount = + page.accept( + new DataPage.Visitor() { + @Override + public Integer visit(DataPageV1 dataPageV1) { + return readPageV1(dataPageV1); + } + + @Override + public Integer visit(DataPageV2 dataPageV2) { + return readPageV2(dataPageV2); + } + }); + readState.resetForNewPage(pageValueCount, pageFirstRowIndex); + return pageValueCount; } private void initDataReader(Encoding dataEncoding, ByteBufferInputStream in, int valueCount) throws IOException { - this.pageValueCount = valueCount; - this.endOfPageValueCount = valuesRead + pageValueCount; + // this.pageValueCount = valueCount; + // this.endOfPageValueCount = valuesRead + pageValueCount; if (dataEncoding.usesDictionary()) { this.dataColumn = null; if (dictionary == null) { @@ -577,13 +616,14 @@ private void initDataReader(Encoding dataEncoding, ByteBufferInputStream in, int } try { - dataColumn.initFromPage(pageValueCount, in); + dataColumn.initFromPage(valueCount, in); } catch (IOException e) { throw new IOException(String.format("Could not read page in col %s.", descriptor), e); } } - private void readPageV1(DataPageV1 page) { + private int readPageV1(DataPageV1 page) { + int pageValueCount = page.getValueCount(); ValuesReader rlReader = page.getRlEncoding().getValuesReader(descriptor, REPETITION_LEVEL); ValuesReader dlReader = page.getDlEncoding().getValuesReader(descriptor, DEFINITION_LEVEL); this.repetitionLevelColumn = new ValuesReaderIntIterator(rlReader); @@ -597,15 +637,16 @@ private void readPageV1(DataPageV1 page) { LOG.debug("Reading definition levels at {}.", in.position()); dlReader.initFromPage(pageValueCount, in); LOG.debug("Reading data at {}.", in.position()); - initDataReader(page.getValueEncoding(), in, page.getValueCount()); + initDataReader(page.getValueEncoding(), in, pageValueCount); + return pageValueCount; } catch (IOException e) { throw new ParquetDecodingException( String.format("Could not read page %s in col %s.", page, descriptor), e); } } - private void readPageV2(DataPageV2 page) { - this.pageValueCount = page.getValueCount(); + private int readPageV2(DataPageV2 page) { + int pageValueCount = page.getValueCount(); this.repetitionLevelColumn = newRLEIterator(descriptor.getMaxRepetitionLevel(), page.getRepetitionLevels()); this.definitionLevelColumn = @@ -615,8 +656,8 @@ private void readPageV2(DataPageV2 page) { "Page data size {} bytes and {} records.", page.getData().size(), pageValueCount); - initDataReader( - page.getDataEncoding(), page.getData().toInputStream(), page.getValueCount()); + initDataReader(page.getDataEncoding(), page.getData().toInputStream(), pageValueCount); + return pageValueCount; } catch (IOException e) { throw new ParquetDecodingException( String.format("Could not read page %s in col %s.", page, descriptor), e); diff --git 
a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetReadState.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetReadState.java new file mode 100644 index 0000000000000..a6003676825a1 --- /dev/null +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetReadState.java @@ -0,0 +1,148 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.format.parquet.reader; + +import java.util.ArrayList; +import java.util.Iterator; +import java.util.List; +import java.util.PrimitiveIterator; + +/** Parquet reader state for column index. */ +public class ParquetReadState { + /** A special row range used when there is no row indexes (hence all rows must be included). */ + private static final RowRange MAX_ROW_RANGE = new RowRange(Long.MIN_VALUE, Long.MAX_VALUE); + + /** + * A special row range used when the row indexes are present AND all the row ranges have been + * processed. This serves as a sentinel at the end indicating that all rows come after the last + * row range should be skipped. + */ + private static final RowRange END_ROW_RANGE = new RowRange(Long.MAX_VALUE, Long.MIN_VALUE); + + private final Iterator rowRanges; + + private RowRange currentRange; + + /** row index for the next read. */ + long rowId; + + int valuesToReadInPage; + int rowsToReadInBatch; + + public ParquetReadState(PrimitiveIterator.OfLong rowIndexes) { + this.rowRanges = constructRanges(rowIndexes); + nextRange(); + } + + /** + * Construct a list of row ranges from the given `rowIndexes`. For example, suppose the + * `rowIndexes` are `[0, 1, 2, 4, 5, 7, 8, 9]`, it will be converted into 3 row ranges: `[0-2], + * [4-5], [7-9]`. + */ + private Iterator constructRanges(PrimitiveIterator.OfLong rowIndexes) { + if (rowIndexes == null) { + return null; + } + + List rowRanges = new ArrayList<>(); + long currentStart = Long.MIN_VALUE; + long previous = Long.MIN_VALUE; + + while (rowIndexes.hasNext()) { + long idx = rowIndexes.nextLong(); + if (currentStart == Long.MIN_VALUE) { + currentStart = idx; + } else if (previous + 1 != idx) { + RowRange range = new RowRange(currentStart, previous); + rowRanges.add(range); + currentStart = idx; + } + previous = idx; + } + + if (previous != Long.MIN_VALUE) { + rowRanges.add(new RowRange(currentStart, previous)); + } + + return rowRanges.iterator(); + } + + /** Must be called at the beginning of reading a new batch. */ + void resetForNewBatch(int batchSize) { + this.rowsToReadInBatch = batchSize; + } + + /** Must be called at the beginning of reading a new page. 
*/ + void resetForNewPage(int totalValuesInPage, long pageFirstRowIndex) { + this.valuesToReadInPage = totalValuesInPage; + this.rowId = pageFirstRowIndex; + } + + /** Returns the start index of the current row range. */ + public long currentRangeStart() { + return currentRange.start; + } + + /** Returns the end index of the current row range. */ + public long currentRangeEnd() { + return currentRange.end; + } + + public boolean isFinished() { + return this.currentRange.equals(this.END_ROW_RANGE); + } + + public boolean isMaxRange() { + return this.currentRange.equals(this.MAX_ROW_RANGE); + } + + public RowRange getCurrentRange() { + return currentRange; + } + + /** Advance to the next range. */ + public void nextRange() { + if (rowRanges == null) { + currentRange = MAX_ROW_RANGE; + } else if (!rowRanges.hasNext()) { + currentRange = END_ROW_RANGE; + } else { + currentRange = rowRanges.next(); + } + } + + /** Helper struct to represent a range of row indexes `[start, end]`. */ + public static class RowRange { + final long start; + final long end; + + RowRange(long start, long end) { + this.start = start; + this.end = end; + } + + @Override + public boolean equals(Object obj) { + if (!(obj instanceof RowRange)) { + return false; + } + return ((RowRange) obj).start == this.start && ((RowRange) obj).end == this.end; + } + } +} diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetSplitReaderUtil.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetSplitReaderUtil.java index 860ec54fa88b0..a2be77414d5ac 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetSplitReaderUtil.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ParquetSplitReaderUtil.java @@ -87,58 +87,45 @@ public static ColumnReader createColumnReader( getAllColumnDescriptorByType(depth, type, columnDescriptors); switch (fieldType.getTypeRoot()) { case BOOLEAN: - return new BooleanColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new BooleanColumnReader(descriptors.get(0), pages); case TINYINT: - return new ByteColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new ByteColumnReader(descriptors.get(0), pages); case DOUBLE: - return new DoubleColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new DoubleColumnReader(descriptors.get(0), pages); case FLOAT: - return new FloatColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new FloatColumnReader(descriptors.get(0), pages); case INTEGER: case DATE: case TIME_WITHOUT_TIME_ZONE: - return new IntColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new IntColumnReader(descriptors.get(0), pages); case BIGINT: - return new LongColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new LongColumnReader(descriptors.get(0), pages); case SMALLINT: - return new ShortColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new ShortColumnReader(descriptors.get(0), pages); case CHAR: case VARCHAR: case BINARY: case VARBINARY: - return new BytesColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new BytesColumnReader(descriptors.get(0), pages); case TIMESTAMP_WITHOUT_TIME_ZONE: case TIMESTAMP_WITH_LOCAL_TIME_ZONE: if (descriptors.get(0).getPrimitiveType().getPrimitiveTypeName() == 
PrimitiveType.PrimitiveTypeName.INT64) { - return new LongColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new LongColumnReader(descriptors.get(0), pages); } - return new TimestampColumnReader( - true, descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new TimestampColumnReader(true, descriptors.get(0), pages); case DECIMAL: switch (descriptors.get(0).getPrimitiveType().getPrimitiveTypeName()) { case INT32: - return new IntColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new IntColumnReader(descriptors.get(0), pages); case INT64: - return new LongColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new LongColumnReader(descriptors.get(0), pages); case BINARY: - return new BytesColumnReader( - descriptors.get(0), pages.getPageReader(descriptors.get(0))); + return new BytesColumnReader(descriptors.get(0), pages); case FIXED_LEN_BYTE_ARRAY: return new FixedLenBytesColumnReader( descriptors.get(0), - pages.getPageReader(descriptors.get(0)), + pages, ((DecimalType) fieldType).getPrecision()); } case ARRAY: diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/RunLengthDecoder.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/RunLengthDecoder.java index 2dd1655d571f0..ebb8f28fa1eee 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/RunLengthDecoder.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/RunLengthDecoder.java @@ -194,6 +194,51 @@ private void readDictionaryIdData(int total, WritableIntVector c, int rowId) { } } + void skipDictionaryIds(int total, int level, RunLengthDecoder data) { + int left = total; + while (left > 0) { + if (this.currentCount == 0) { + this.readNextGroup(); + } + int n = Math.min(left, this.currentCount); + switch (mode) { + case RLE: + if (currentValue == level) { + data.skipDictionaryIdData(n); + } + break; + case PACKED: + for (int i = 0; i < n; ++i) { + if (currentBuffer[currentBufferIdx++] == level) { + data.readInteger(); + } + } + break; + } + left -= n; + currentCount -= n; + } + } + + private void skipDictionaryIdData(int total) { + int left = total; + while (left > 0) { + if (this.currentCount == 0) { + this.readNextGroup(); + } + int n = Math.min(left, this.currentCount); + switch (mode) { + case RLE: + break; + case PACKED: + currentBufferIdx += n; + break; + } + left -= n; + currentCount -= n; + } + } + /** Reads the next varint encoded int. */ private int readUnsignedVarInt() throws IOException { int value = 0; diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ShortColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ShortColumnReader.java index 7b32232261a7b..bdb2f401fa3f3 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ShortColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/ShortColumnReader.java @@ -22,7 +22,7 @@ import org.apache.paimon.data.columnar.writable.WritableShortVector; import org.apache.parquet.column.ColumnDescriptor; -import org.apache.parquet.column.page.PageReader; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.schema.PrimitiveType; import java.io.IOException; @@ -30,9 +30,9 @@ /** Short {@link ColumnReader}. Using INT32 to store short, so just cast int to short. 
*/ public class ShortColumnReader extends AbstractColumnReader { - public ShortColumnReader(ColumnDescriptor descriptor, PageReader pageReader) + public ShortColumnReader(ColumnDescriptor descriptor, PageReadStore pageReadStore) throws IOException { - super(descriptor, pageReader); + super(descriptor, pageReadStore); checkTypeName(PrimitiveType.PrimitiveTypeName.INT32); } @@ -71,6 +71,38 @@ protected void readBatch(int rowId, int num, WritableShortVector column) { } } + @Override + protected void skipBatch(int num) { + int left = num; + while (left > 0) { + if (runLenDecoder.currentCount == 0) { + runLenDecoder.readNextGroup(); + } + int n = Math.min(left, runLenDecoder.currentCount); + switch (runLenDecoder.mode) { + case RLE: + if (runLenDecoder.currentValue == maxDefLevel) { + skipShot(n); + } + break; + case PACKED: + for (int i = 0; i < n; ++i) { + if (runLenDecoder.currentBuffer[runLenDecoder.currentBufferIdx++] + == maxDefLevel) { + skipShot(1); + } + } + break; + } + left -= n; + runLenDecoder.currentCount -= n; + } + } + + private void skipShot(int num) { + skipDataBuffer(4 * num); + } + @Override protected void readBatchFromDictionaryIds( int rowId, int num, WritableShortVector column, WritableIntVector dictionaryIds) { diff --git a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/TimestampColumnReader.java b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/TimestampColumnReader.java index 4a279ff90e15f..8767173315c24 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/TimestampColumnReader.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/parquet/reader/TimestampColumnReader.java @@ -23,7 +23,7 @@ import org.apache.paimon.data.columnar.writable.WritableTimestampVector; import org.apache.parquet.column.ColumnDescriptor; -import org.apache.parquet.column.page.PageReader; +import org.apache.parquet.column.page.PageReadStore; import org.apache.parquet.io.api.Binary; import org.apache.parquet.schema.PrimitiveType; @@ -49,9 +49,9 @@ public class TimestampColumnReader extends AbstractColumnReader Date: Tue, 3 Dec 2024 23:20:15 +0800 Subject: [PATCH 099/157] [doc] Add data types in concept (#4625) --- docs/content/concepts/data-types.md | 179 ++++++++++++++++++ docs/content/concepts/spec/_index.md | 2 +- .../generated/format_table_configuration.html | 36 ++++ .../ConfigOptionsDocGenerator.java | 1 + 4 files changed, 217 insertions(+), 1 deletion(-) create mode 100644 docs/content/concepts/data-types.md create mode 100644 docs/layouts/shortcodes/generated/format_table_configuration.html diff --git a/docs/content/concepts/data-types.md b/docs/content/concepts/data-types.md new file mode 100644 index 0000000000000..b33dcd428399b --- /dev/null +++ b/docs/content/concepts/data-types.md @@ -0,0 +1,179 @@ +--- +title: "Data Types" +weight: 7 +type: docs +aliases: +- /concepts/data-types.html +--- + + +# Data Types + +A data type describes the logical type of a value in the table ecosystem. It can be used to declare input and/or output types of operations. + +All data types supported by Paimon are as follows: + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+| DataType | Description |
+|----------|-------------|
+| `BOOLEAN` | Data type of a boolean with a (possibly) three-valued logic of TRUE, FALSE, and UNKNOWN. |
+| `CHAR`<br>`CHAR(n)` | Data type of a fixed-length character string.<br><br>The type can be declared using `CHAR(n)` where n is the number of code points. n must have a value between 1 and 2,147,483,647 (both inclusive). If no length is specified, n is equal to 1. |
+| `VARCHAR`<br>`VARCHAR(n)`<br>`STRING` | Data type of a variable-length character string.<br><br>The type can be declared using `VARCHAR(n)` where n is the maximum number of code points. n must have a value between 1 and 2,147,483,647 (both inclusive). If no length is specified, n is equal to 1.<br><br>`STRING` is a synonym for `VARCHAR(2147483647)`. |
+| `BINARY`<br>`BINARY(n)` | Data type of a fixed-length binary string (=a sequence of bytes).<br><br>The type can be declared using `BINARY(n)` where n is the number of bytes. n must have a value between 1 and 2,147,483,647 (both inclusive). If no length is specified, n is equal to 1. |
+| `VARBINARY`<br>`VARBINARY(n)`<br>`BYTES` | Data type of a variable-length binary string (=a sequence of bytes).<br><br>The type can be declared using `VARBINARY(n)` where n is the maximum number of bytes. n must have a value between 1 and 2,147,483,647 (both inclusive). If no length is specified, n is equal to 1.<br><br>`BYTES` is a synonym for `VARBINARY(2147483647)`. |
+| `DECIMAL`<br>`DECIMAL(p)`<br>`DECIMAL(p, s)` | Data type of a decimal number with fixed precision and scale.<br><br>The type can be declared using `DECIMAL(p, s)` where p is the number of digits in a number (precision) and s is the number of digits to the right of the decimal point in a number (scale). p must have a value between 1 and 38 (both inclusive). s must have a value between 0 and p (both inclusive). The default value for p is 10. The default value for s is 0. |
+| `TINYINT` | Data type of a 1-byte signed integer with values from -128 to 127. |
+| `SMALLINT` | Data type of a 2-byte signed integer with values from -32,768 to 32,767. |
+| `INT` | Data type of a 4-byte signed integer with values from -2,147,483,648 to 2,147,483,647. |
+| `BIGINT` | Data type of an 8-byte signed integer with values from -9,223,372,036,854,775,808 to 9,223,372,036,854,775,807. |
+| `FLOAT` | Data type of a 4-byte single precision floating point number.<br><br>Compared to the SQL standard, the type does not take parameters. |
+| `DOUBLE` | Data type of an 8-byte double precision floating point number. |
+| `DATE` | Data type of a date consisting of year-month-day with values ranging from 0000-01-01 to 9999-12-31.<br><br>Compared to the SQL standard, the range starts at year 0000. |
+| `TIME`<br>`TIME(p)` | Data type of a time without time zone consisting of hour:minute:second[.fractional] with up to nanosecond precision and values ranging from 00:00:00.000000000 to 23:59:59.999999999.<br><br>The type can be declared using `TIME(p)` where p is the number of digits of fractional seconds (precision). p must have a value between 0 and 9 (both inclusive). If no precision is specified, p is equal to 0. |
+| `TIMESTAMP`<br>`TIMESTAMP(p)` | Data type of a timestamp without time zone consisting of year-month-day hour:minute:second[.fractional] with up to nanosecond precision and values ranging from 0000-01-01 00:00:00.000000000 to 9999-12-31 23:59:59.999999999.<br><br>The type can be declared using `TIMESTAMP(p)` where p is the number of digits of fractional seconds (precision). p must have a value between 0 and 9 (both inclusive). If no precision is specified, p is equal to 6. |
+| `TIMESTAMP WITH TIME ZONE`<br>`TIMESTAMP(p) WITH TIME ZONE` | Data type of a timestamp with time zone consisting of year-month-day hour:minute:second[.fractional] zone with up to nanosecond precision and values ranging from 0000-01-01 00:00:00.000000000 +14:59 to 9999-12-31 23:59:59.999999999 -14:59.<br><br>This type fills the gap between time zone free and time zone mandatory timestamp types by allowing the interpretation of UTC timestamps according to the configured session time zone. A conversion from and to int describes the number of seconds since epoch. A conversion from and to long describes the number of milliseconds since epoch. |
+| `ARRAY<t>` | Data type of an array of elements with same subtype.<br><br>Compared to the SQL standard, the maximum cardinality of an array cannot be specified but is fixed at 2,147,483,647. Also, any valid type is supported as a subtype.<br><br>The type can be declared using `ARRAY<t>` where t is the data type of the contained elements. |
+| `MAP<kt, vt>` | Data type of an associative array that maps keys (including NULL) to values (including NULL). A map cannot contain duplicate keys; each key can map to at most one value.<br><br>There is no restriction of element types; it is the responsibility of the user to ensure uniqueness.<br><br>The type can be declared using `MAP<kt, vt>` where kt is the data type of the key elements and vt is the data type of the value elements. |
+| `MULTISET<t>` | Data type of a multiset (=bag). Unlike a set, it allows for multiple instances for each of its elements with a common subtype. Each unique value (including NULL) is mapped to some multiplicity.<br><br>There is no restriction of element types; it is the responsibility of the user to ensure uniqueness.<br><br>The type can be declared using `MULTISET<t>` where t is the data type of the contained elements. |
+| `ROW<n0 t0, n1 t1, ...>`<br>`ROW<n0 t0 'd0', n1 t1 'd1', ...>` | Data type of a sequence of fields.<br><br>A field consists of a field name, field type, and an optional description. The most specific type of a row of a table is a row type. In this case, each column of the row corresponds to the field of the row type that has the same ordinal position as the column.<br><br>Compared to the SQL standard, an optional field description simplifies the handling with complex structures.<br><br>A row type is similar to the STRUCT type known from other non-standard-compliant frameworks.<br><br>The type can be declared using `ROW<n0 t0 'd0', n1 t1 'd1', ...>` where n is the unique name of a field, t is the logical type of a field, d is the description of a field. |
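To make the table above concrete, here is a small illustrative Java sketch (not part of the patch itself) that assembles a row type from a few of these logical types using Paimon's type API. Only `DataTypes.STRING()`, `DataField`, and `RowType` appear verbatim elsewhere in this patch series; the other `DataTypes` factory methods used below (`INT()`, `DECIMAL(p, s)`, `ARRAY(...)`, `MAP(...)`) are assumed to follow the same pattern.

```java
import java.util.Arrays;

import org.apache.paimon.types.DataField;
import org.apache.paimon.types.DataTypes;
import org.apache.paimon.types.RowType;

public class DataTypesExample {

    public static void main(String[] args) {
        // ROW<id INT, name STRING, price DECIMAL(10, 2), tags ARRAY<STRING>, props MAP<STRING, STRING>>
        RowType rowType =
                new RowType(
                        Arrays.asList(
                                new DataField(0, "id", DataTypes.INT()),
                                new DataField(1, "name", DataTypes.STRING()),
                                new DataField(2, "price", DataTypes.DECIMAL(10, 2)),
                                new DataField(3, "tags", DataTypes.ARRAY(DataTypes.STRING())),
                                new DataField(
                                        4,
                                        "props",
                                        DataTypes.MAP(
                                                DataTypes.STRING(), DataTypes.STRING()))));

        // Each DataField carries a field id, a name and a logical type; the ids are what
        // schema evolution (and the key-field trimming later in this patch series) matches on.
        System.out.println(rowType);
    }
}
```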
    diff --git a/docs/content/concepts/spec/_index.md b/docs/content/concepts/spec/_index.md index ef5f03098e20d..cc148d6a8b533 100644 --- a/docs/content/concepts/spec/_index.md +++ b/docs/content/concepts/spec/_index.md @@ -1,7 +1,7 @@ --- title: Specification bookCollapseSection: true -weight: 7 +weight: 8 --- - + From b6fb4715021a2261230773645f114fb7140dcc08 Mon Sep 17 00:00:00 2001 From: Jingsong Lee Date: Tue, 10 Dec 2024 14:01:22 +0800 Subject: [PATCH 129/157] [core] Introduce data-file.path-directory (#4672) --- .../migration/iceberg-compatibility.md | 6 ++++++ .../generated/core_configuration.html | 6 ++++++ .../java/org/apache/paimon/CoreOptions.java | 11 ++++++++++ .../org/apache/paimon/AbstractFileStore.java | 9 ++++++-- .../org/apache/paimon/KeyValueFileStore.java | 15 +------------ .../paimon/utils/FileStorePathFactory.java | 13 ++++++++++-- .../paimon/io/KeyValueFileReadWriteTest.java | 6 ++++-- .../manifest/ManifestFileMetaTestBase.java | 3 ++- .../paimon/manifest/ManifestFileTest.java | 3 ++- .../paimon/manifest/ManifestListTest.java | 3 ++- .../table/AppendOnlyFileStoreTableTest.java | 21 +++++++++++++++++++ .../utils/FileStorePathFactoryTest.java | 6 ++++-- .../source/TestChangelogDataReadWrite.java | 3 ++- .../paimon/spark/SparkFileIndexITCase.java | 3 ++- 14 files changed, 81 insertions(+), 27 deletions(-) diff --git a/docs/content/migration/iceberg-compatibility.md b/docs/content/migration/iceberg-compatibility.md index 8a1637d7e96e8..54018b073f91f 100644 --- a/docs/content/migration/iceberg-compatibility.md +++ b/docs/content/migration/iceberg-compatibility.md @@ -402,6 +402,12 @@ You can use Hive Catalog to connect AWS Glue metastore, you can use set `'metada AWS Athena may use old manifest reader to read Iceberg manifest by names, we should let Paimon producing legacy Iceberg manifest list file, you can enable: `'metadata.iceberg.manifest-legacy-version'`. +## DuckDB + +Duckdb may rely on files placed in the `root/data` directory, while Paimon is usually placed directly in the `root` +directory, so you can configure this parameter for the table to achieve compatibility: +`'data-file.path-directory' = 'data'`. + ## Trino Iceberg In this example, we use Trino Iceberg connector to access Paimon table through Iceberg Hive catalog. diff --git a/docs/layouts/shortcodes/generated/core_configuration.html b/docs/layouts/shortcodes/generated/core_configuration.html index 52b64a3a565db..b2bd3a976d66d 100644 --- a/docs/layouts/shortcodes/generated/core_configuration.html +++ b/docs/layouts/shortcodes/generated/core_configuration.html @@ -218,6 +218,12 @@ Duration The TTL in rocksdb index for cross partition upsert (primary keys not contain all partition fields), this can avoid maintaining too many indexes and lead to worse and worse performance, but please note that this may also cause data duplication. + +
+        <tr>
+            <td><h5>data-file.path-directory</h5></td>
+            <td style="word-wrap: break-word;">(none)</td>
+            <td>String</td>
+            <td>Specify the path directory of data files.</td>
+        </tr>
         <tr>
             <td><h5>data-file.prefix</h5></td>
             <td style="word-wrap: break-word;">
    "data-" diff --git a/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java b/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java index f42bb8aeca985..5db809cff1d1f 100644 --- a/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java +++ b/paimon-common/src/main/java/org/apache/paimon/CoreOptions.java @@ -184,6 +184,12 @@ public class CoreOptions implements Serializable { .defaultValue("data-") .withDescription("Specify the file name prefix of data files."); + public static final ConfigOption DATA_FILE_PATH_DIRECTORY = + key("data-file.path-directory") + .stringType() + .noDefaultValue() + .withDescription("Specify the path directory of data files."); + public static final ConfigOption CHANGELOG_FILE_PREFIX = key("changelog-file.prefix") .stringType() @@ -1638,6 +1644,11 @@ public String dataFilePrefix() { return options.get(DATA_FILE_PREFIX); } + @Nullable + public String dataFilePathDirectory() { + return options.get(DATA_FILE_PATH_DIRECTORY); + } + public String changelogFilePrefix() { return options.get(CHANGELOG_FILE_PREFIX); } diff --git a/paimon-core/src/main/java/org/apache/paimon/AbstractFileStore.java b/paimon-core/src/main/java/org/apache/paimon/AbstractFileStore.java index e6d63149149c4..1caff252a6547 100644 --- a/paimon-core/src/main/java/org/apache/paimon/AbstractFileStore.java +++ b/paimon-core/src/main/java/org/apache/paimon/AbstractFileStore.java @@ -105,16 +105,21 @@ protected AbstractFileStore( @Override public FileStorePathFactory pathFactory() { + return pathFactory(options.fileFormat().getFormatIdentifier()); + } + + protected FileStorePathFactory pathFactory(String format) { return new FileStorePathFactory( options.path(), partitionType, options.partitionDefaultName(), - options.fileFormat().getFormatIdentifier(), + format, options.dataFilePrefix(), options.changelogFilePrefix(), options.legacyPartitionName(), options.fileSuffixIncludeCompression(), - options.fileCompression()); + options.fileCompression(), + options.dataFilePathDirectory()); } @Override diff --git a/paimon-core/src/main/java/org/apache/paimon/KeyValueFileStore.java b/paimon-core/src/main/java/org/apache/paimon/KeyValueFileStore.java index 1c87a087e44eb..8cf45105c01b8 100644 --- a/paimon-core/src/main/java/org/apache/paimon/KeyValueFileStore.java +++ b/paimon-core/src/main/java/org/apache/paimon/KeyValueFileStore.java @@ -194,20 +194,7 @@ private Map format2PathFactory() { Map pathFactoryMap = new HashMap<>(); Set formats = new HashSet<>(options.fileFormatPerLevel().values()); formats.add(options.fileFormat().getFormatIdentifier()); - formats.forEach( - format -> - pathFactoryMap.put( - format, - new FileStorePathFactory( - options.path(), - partitionType, - options.partitionDefaultName(), - format, - options.dataFilePrefix(), - options.changelogFilePrefix(), - options.legacyPartitionName(), - options.fileSuffixIncludeCompression(), - options.fileCompression()))); + formats.forEach(format -> pathFactoryMap.put(format, pathFactory(format))); return pathFactoryMap; } diff --git a/paimon-core/src/main/java/org/apache/paimon/utils/FileStorePathFactory.java b/paimon-core/src/main/java/org/apache/paimon/utils/FileStorePathFactory.java index fcdc4634d74ab..8896ec3286802 100644 --- a/paimon-core/src/main/java/org/apache/paimon/utils/FileStorePathFactory.java +++ b/paimon-core/src/main/java/org/apache/paimon/utils/FileStorePathFactory.java @@ -24,6 +24,7 @@ import org.apache.paimon.io.DataFilePathFactory; import org.apache.paimon.types.RowType; +import javax.annotation.Nullable; 
import javax.annotation.concurrent.ThreadSafe; import java.util.List; @@ -46,6 +47,8 @@ public class FileStorePathFactory { private final boolean fileSuffixIncludeCompression; private final String fileCompression; + @Nullable private final String dataFilePathDirectory; + private final AtomicInteger manifestFileCount; private final AtomicInteger manifestListCount; private final AtomicInteger indexManifestCount; @@ -61,8 +64,10 @@ public FileStorePathFactory( String changelogFilePrefix, boolean legacyPartitionName, boolean fileSuffixIncludeCompression, - String fileCompression) { + String fileCompression, + @Nullable String dataFilePathDirectory) { this.root = root; + this.dataFilePathDirectory = dataFilePathDirectory; this.uuid = UUID.randomUUID().toString(); this.partitionComputer = @@ -125,7 +130,11 @@ public DataFilePathFactory createDataFilePathFactory(BinaryRow partition, int bu } public Path bucketPath(BinaryRow partition, int bucket) { - return new Path(root + "/" + relativePartitionAndBucketPath(partition, bucket)); + Path dataFileRoot = this.root; + if (dataFilePathDirectory != null) { + dataFileRoot = new Path(dataFileRoot, dataFilePathDirectory); + } + return new Path(dataFileRoot + "/" + relativePartitionAndBucketPath(partition, bucket)); } public Path relativePartitionAndBucketPath(BinaryRow partition, int bucket) { diff --git a/paimon-core/src/test/java/org/apache/paimon/io/KeyValueFileReadWriteTest.java b/paimon-core/src/test/java/org/apache/paimon/io/KeyValueFileReadWriteTest.java index 52d56afad8134..b648e2af89727 100644 --- a/paimon-core/src/test/java/org/apache/paimon/io/KeyValueFileReadWriteTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/io/KeyValueFileReadWriteTest.java @@ -231,7 +231,8 @@ protected KeyValueFileWriterFactory createWriterFactory(String pathStr, String f CoreOptions.CHANGELOG_FILE_PREFIX.defaultValue(), CoreOptions.PARTITION_GENERATE_LEGCY_NAME.defaultValue(), CoreOptions.FILE_SUFFIX_INCLUDE_COMPRESSION.defaultValue(), - CoreOptions.FILE_COMPRESSION.defaultValue()); + CoreOptions.FILE_COMPRESSION.defaultValue(), + null); int suggestedFileSize = ThreadLocalRandom.current().nextInt(8192) + 1024; FileIO fileIO = FileIOFinder.find(path); Options options = new Options(); @@ -250,7 +251,8 @@ protected KeyValueFileWriterFactory createWriterFactory(String pathStr, String f CoreOptions.CHANGELOG_FILE_PREFIX.defaultValue(), CoreOptions.PARTITION_GENERATE_LEGCY_NAME.defaultValue(), CoreOptions.FILE_SUFFIX_INCLUDE_COMPRESSION.defaultValue(), - CoreOptions.FILE_COMPRESSION.defaultValue())); + CoreOptions.FILE_COMPRESSION.defaultValue(), + null)); return KeyValueFileWriterFactory.builder( fileIO, diff --git a/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileMetaTestBase.java b/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileMetaTestBase.java index 5e69035ca8348..52d82e76be2ab 100644 --- a/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileMetaTestBase.java +++ b/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileMetaTestBase.java @@ -149,7 +149,8 @@ protected ManifestFile createManifestFile(String pathStr) { CoreOptions.CHANGELOG_FILE_PREFIX.defaultValue(), CoreOptions.PARTITION_GENERATE_LEGCY_NAME.defaultValue(), CoreOptions.FILE_SUFFIX_INCLUDE_COMPRESSION.defaultValue(), - CoreOptions.FILE_COMPRESSION.defaultValue()), + CoreOptions.FILE_COMPRESSION.defaultValue(), + null), Long.MAX_VALUE, null) .create(); diff --git a/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileTest.java 
b/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileTest.java index 34cca41e61a1f..089e11656a995 100644 --- a/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileTest.java @@ -105,7 +105,8 @@ private ManifestFile createManifestFile(String pathStr) { CoreOptions.CHANGELOG_FILE_PREFIX.defaultValue(), CoreOptions.PARTITION_GENERATE_LEGCY_NAME.defaultValue(), CoreOptions.FILE_SUFFIX_INCLUDE_COMPRESSION.defaultValue(), - CoreOptions.FILE_COMPRESSION.defaultValue()); + CoreOptions.FILE_COMPRESSION.defaultValue(), + null); int suggestedFileSize = ThreadLocalRandom.current().nextInt(8192) + 1024; FileIO fileIO = FileIOFinder.find(path); return new ManifestFile.Factory( diff --git a/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestListTest.java b/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestListTest.java index ce4f7b8072d2a..5bf01f32cb07d 100644 --- a/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestListTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestListTest.java @@ -109,7 +109,8 @@ private ManifestList createManifestList(String pathStr) { CoreOptions.CHANGELOG_FILE_PREFIX.defaultValue(), CoreOptions.PARTITION_GENERATE_LEGCY_NAME.defaultValue(), CoreOptions.FILE_SUFFIX_INCLUDE_COMPRESSION.defaultValue(), - CoreOptions.FILE_COMPRESSION.defaultValue()); + CoreOptions.FILE_COMPRESSION.defaultValue(), + null); return new ManifestList.Factory(FileIOFinder.find(path), avro, "zstd", pathFactory, null) .create(); } diff --git a/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java b/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java index 922221bb8dc99..01d4e89af95d6 100644 --- a/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/table/AppendOnlyFileStoreTableTest.java @@ -78,6 +78,7 @@ import static org.apache.paimon.CoreOptions.BUCKET; import static org.apache.paimon.CoreOptions.BUCKET_KEY; +import static org.apache.paimon.CoreOptions.DATA_FILE_PATH_DIRECTORY; import static org.apache.paimon.CoreOptions.FILE_INDEX_IN_MANIFEST_THRESHOLD; import static org.apache.paimon.CoreOptions.METADATA_STATS_MODE; import static org.apache.paimon.io.DataFileTestUtils.row; @@ -143,6 +144,26 @@ public void testBatchReadWrite() throws Exception { "2|21|201|binary|varbinary|mapKey:mapVal|multiset")); } + @Test + public void testReadWriteWithDataDirectory() throws Exception { + Consumer optionsSetter = options -> options.set(DATA_FILE_PATH_DIRECTORY, "data"); + writeData(optionsSetter); + FileStoreTable table = createFileStoreTable(optionsSetter); + + assertThat(table.fileIO().exists(new Path(tablePath, "data/pt=1"))).isTrue(); + + List splits = toSplits(table.newSnapshotReader().read().dataSplits()); + TableRead read = table.newRead(); + assertThat(getResult(read, splits, binaryRow(1), 0, BATCH_ROW_TO_STRING)) + .hasSameElementsAs( + Arrays.asList( + "1|10|100|binary|varbinary|mapKey:mapVal|multiset", + "1|11|101|binary|varbinary|mapKey:mapVal|multiset", + "1|12|102|binary|varbinary|mapKey:mapVal|multiset", + "1|11|101|binary|varbinary|mapKey:mapVal|multiset", + "1|12|102|binary|varbinary|mapKey:mapVal|multiset")); + } + @Test public void testBatchRecordsWrite() throws Exception { FileStoreTable table = createFileStoreTable(); diff --git 
a/paimon-core/src/test/java/org/apache/paimon/utils/FileStorePathFactoryTest.java b/paimon-core/src/test/java/org/apache/paimon/utils/FileStorePathFactoryTest.java index d4d45b3129614..6ca15cf1503d7 100644 --- a/paimon-core/src/test/java/org/apache/paimon/utils/FileStorePathFactoryTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/utils/FileStorePathFactoryTest.java @@ -90,7 +90,8 @@ public void testCreateDataFilePathFactoryWithPartition() { CoreOptions.CHANGELOG_FILE_PREFIX.defaultValue(), CoreOptions.PARTITION_GENERATE_LEGCY_NAME.defaultValue(), CoreOptions.FILE_SUFFIX_INCLUDE_COMPRESSION.defaultValue(), - CoreOptions.FILE_COMPRESSION.defaultValue()); + CoreOptions.FILE_COMPRESSION.defaultValue(), + null); assertPartition("20211224", 16, pathFactory, "/dt=20211224/hr=16"); assertPartition("20211224", null, pathFactory, "/dt=20211224/hr=default"); @@ -130,6 +131,7 @@ public static FileStorePathFactory createNonPartFactory(Path root) { CoreOptions.CHANGELOG_FILE_PREFIX.defaultValue(), CoreOptions.PARTITION_GENERATE_LEGCY_NAME.defaultValue(), CoreOptions.FILE_SUFFIX_INCLUDE_COMPRESSION.defaultValue(), - CoreOptions.FILE_COMPRESSION.defaultValue()); + CoreOptions.FILE_COMPRESSION.defaultValue(), + null); } } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/TestChangelogDataReadWrite.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/TestChangelogDataReadWrite.java index 85679e5fd30af..17e63700faac7 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/TestChangelogDataReadWrite.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/TestChangelogDataReadWrite.java @@ -110,7 +110,8 @@ public TestChangelogDataReadWrite(String root) { CoreOptions.CHANGELOG_FILE_PREFIX.defaultValue(), CoreOptions.PARTITION_GENERATE_LEGCY_NAME.defaultValue(), CoreOptions.FILE_SUFFIX_INCLUDE_COMPRESSION.defaultValue(), - CoreOptions.FILE_COMPRESSION.defaultValue()); + CoreOptions.FILE_COMPRESSION.defaultValue(), + null); this.snapshotManager = new SnapshotManager(LocalFileIO.create(), new Path(root)); this.commitUser = UUID.randomUUID().toString(); } diff --git a/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkFileIndexITCase.java b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkFileIndexITCase.java index 7da8f2e6b7fe0..0360def685b6b 100644 --- a/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkFileIndexITCase.java +++ b/paimon-spark/paimon-spark-ut/src/test/java/org/apache/paimon/spark/SparkFileIndexITCase.java @@ -160,7 +160,8 @@ protected void foreachIndexReader(Consumer consumer) CoreOptions.CHANGELOG_FILE_PREFIX.defaultValue(), CoreOptions.PARTITION_GENERATE_LEGCY_NAME.defaultValue(), CoreOptions.FILE_SUFFIX_INCLUDE_COMPRESSION.defaultValue(), - CoreOptions.FILE_COMPRESSION.defaultValue()); + CoreOptions.FILE_COMPRESSION.defaultValue(), + null); Table table = fileSystemCatalog.getTable(Identifier.create("db", "T")); ReadBuilder readBuilder = table.newReadBuilder(); From 369141963500bb938cf40559e6418abf0f41cedd Mon Sep 17 00:00:00 2001 From: YeJunHao <41894543+leaves12138@users.noreply.github.com> Date: Tue, 10 Dec 2024 14:05:17 +0800 Subject: [PATCH 130/157] [core] Trim key field in reading, map it to value field (#4651) This closes #4651. 
--------- Co-authored-by: tsreaper --- .../data/columnar/ColumnarRowIterator.java | 2 +- .../apache/paimon/table/SpecialFields.java | 4 + .../paimon/utils/VectorMappingUtils.java | 3 +- .../paimon/utils/VectorMappingUtilsTest.java | 2 +- .../paimon/io/DataFileRecordReader.java | 1 + .../paimon/utils/BulkFormatMapping.java | 109 +++++++++++-- .../paimon/manifest/ManifestFileMetaTest.java | 2 +- .../paimon/utils/BulkFormatMappingTest.java | 147 ++++++++++++++++++ .../source/TestChangelogDataReadWrite.java | 4 +- 9 files changed, 257 insertions(+), 17 deletions(-) create mode 100644 paimon-core/src/test/java/org/apache/paimon/utils/BulkFormatMappingTest.java diff --git a/paimon-common/src/main/java/org/apache/paimon/data/columnar/ColumnarRowIterator.java b/paimon-common/src/main/java/org/apache/paimon/data/columnar/ColumnarRowIterator.java index 27e3d1c1ddadf..874c221348646 100644 --- a/paimon-common/src/main/java/org/apache/paimon/data/columnar/ColumnarRowIterator.java +++ b/paimon-common/src/main/java/org/apache/paimon/data/columnar/ColumnarRowIterator.java @@ -95,7 +95,7 @@ public ColumnarRowIterator mapping( vectors = VectorMappingUtils.createPartitionMappedVectors(partitionInfo, vectors); } if (indexMapping != null) { - vectors = VectorMappingUtils.createIndexMappedVectors(indexMapping, vectors); + vectors = VectorMappingUtils.createMappedVectors(indexMapping, vectors); } return copy(vectors); } diff --git a/paimon-common/src/main/java/org/apache/paimon/table/SpecialFields.java b/paimon-common/src/main/java/org/apache/paimon/table/SpecialFields.java index d438bfb0ffe9e..3288276a1f649 100644 --- a/paimon-common/src/main/java/org/apache/paimon/table/SpecialFields.java +++ b/paimon-common/src/main/java/org/apache/paimon/table/SpecialFields.java @@ -99,6 +99,10 @@ public static boolean isSystemField(String field) { return field.startsWith(KEY_FIELD_PREFIX) || SYSTEM_FIELD_NAMES.contains(field); } + public static boolean isKeyField(String field) { + return field.startsWith(KEY_FIELD_PREFIX); + } + // ---------------------------------------------------------------------------------------- // Structured type fields // ---------------------------------------------------------------------------------------- diff --git a/paimon-common/src/main/java/org/apache/paimon/utils/VectorMappingUtils.java b/paimon-common/src/main/java/org/apache/paimon/utils/VectorMappingUtils.java index 8b01e644de576..02b011a2f1cf3 100644 --- a/paimon-common/src/main/java/org/apache/paimon/utils/VectorMappingUtils.java +++ b/paimon-common/src/main/java/org/apache/paimon/utils/VectorMappingUtils.java @@ -97,8 +97,7 @@ public static ColumnVector createFixedVector( return dataType.accept(visitor); } - public static ColumnVector[] createIndexMappedVectors( - int[] indexMapping, ColumnVector[] vectors) { + public static ColumnVector[] createMappedVectors(int[] indexMapping, ColumnVector[] vectors) { ColumnVector[] newVectors = new ColumnVector[indexMapping.length]; for (int i = 0; i < indexMapping.length; i++) { int realIndex = indexMapping[i]; diff --git a/paimon-common/src/test/java/org/apache/paimon/utils/VectorMappingUtilsTest.java b/paimon-common/src/test/java/org/apache/paimon/utils/VectorMappingUtilsTest.java index c5fac9c880db9..571a0d7189d6c 100644 --- a/paimon-common/src/test/java/org/apache/paimon/utils/VectorMappingUtilsTest.java +++ b/paimon-common/src/test/java/org/apache/paimon/utils/VectorMappingUtilsTest.java @@ -82,7 +82,7 @@ public void testCreateIndexMappedVectors() { int[] mapping = new int[] {0, 2, 1, 3, 
2, 3, 1, 0, 4}; ColumnVector[] newColumnVectors = - VectorMappingUtils.createIndexMappedVectors(mapping, columnVectors); + VectorMappingUtils.createMappedVectors(mapping, columnVectors); for (int i = 0; i < mapping.length; i++) { Assertions.assertThat(newColumnVectors[i]).isEqualTo(columnVectors[mapping[i]]); diff --git a/paimon-core/src/main/java/org/apache/paimon/io/DataFileRecordReader.java b/paimon-core/src/main/java/org/apache/paimon/io/DataFileRecordReader.java index d2559fe6240b2..16fad55a49a27 100644 --- a/paimon-core/src/main/java/org/apache/paimon/io/DataFileRecordReader.java +++ b/paimon-core/src/main/java/org/apache/paimon/io/DataFileRecordReader.java @@ -76,6 +76,7 @@ public FileRecordIterator readBatch() throws IOException { PartitionSettedRow.from(partitionInfo); iterator = iterator.transform(partitionSettedRow::replaceRow); } + if (indexMapping != null) { final ProjectedRow projectedRow = ProjectedRow.from(indexMapping); iterator = iterator.transform(projectedRow::replaceRow); diff --git a/paimon-core/src/main/java/org/apache/paimon/utils/BulkFormatMapping.java b/paimon-core/src/main/java/org/apache/paimon/utils/BulkFormatMapping.java index 037622f95f1e6..58ef924df1786 100644 --- a/paimon-core/src/main/java/org/apache/paimon/utils/BulkFormatMapping.java +++ b/paimon-core/src/main/java/org/apache/paimon/utils/BulkFormatMapping.java @@ -26,6 +26,7 @@ import org.apache.paimon.schema.IndexCastMapping; import org.apache.paimon.schema.SchemaEvolutionUtil; import org.apache.paimon.schema.TableSchema; +import org.apache.paimon.table.SpecialFields; import org.apache.paimon.types.ArrayType; import org.apache.paimon.types.DataField; import org.apache.paimon.types.DataType; @@ -35,17 +36,25 @@ import javax.annotation.Nullable; import java.util.ArrayList; +import java.util.HashMap; import java.util.HashSet; import java.util.List; +import java.util.Map; import java.util.function.Function; import static org.apache.paimon.predicate.PredicateBuilder.excludePredicateWithFields; +import static org.apache.paimon.table.SpecialFields.KEY_FIELD_ID_START; /** Class with index mapping and bulk format. */ public class BulkFormatMapping { + // Index mapping from data schema fields to table schema fields, this is used to realize paimon + // schema evolution. 
And it combines trimmedKeyMapping, which maps key fields to the value + // fields @Nullable private final int[] indexMapping; + // helps indexMapping cast to different data types @Nullable private final CastFieldGetter[] castMapping; + // partition fields mapping, add partition fields to the read fields @Nullable private final Pair partitionPair; private final FormatReaderFactory bulkFormat; private final TableSchema dataSchema; @@ -54,11 +63,12 @@ public class BulkFormatMapping { public BulkFormatMapping( @Nullable int[] indexMapping, @Nullable CastFieldGetter[] castMapping, + @Nullable int[] trimmedKeyMapping, @Nullable Pair partitionPair, FormatReaderFactory bulkFormat, TableSchema dataSchema, List dataFilters) { - this.indexMapping = indexMapping; + this.indexMapping = combine(indexMapping, trimmedKeyMapping); this.castMapping = castMapping; this.bulkFormat = bulkFormat; this.partitionPair = partitionPair; @@ -66,6 +76,26 @@ public BulkFormatMapping( this.dataFilters = dataFilters; } + private int[] combine(@Nullable int[] indexMapping, @Nullable int[] trimmedKeyMapping) { + if (indexMapping == null) { + return trimmedKeyMapping; + } + if (trimmedKeyMapping == null) { + return indexMapping; + } + + int[] combined = new int[indexMapping.length]; + + for (int i = 0; i < indexMapping.length; i++) { + if (indexMapping[i] < 0) { + combined[i] = indexMapping[i]; + } else { + combined[i] = trimmedKeyMapping[indexMapping[i]]; + } + } + return combined; + } + @Nullable public int[] getIndexMapping() { return indexMapping; @@ -112,24 +142,46 @@ public BulkFormatMappingBuilder( this.filters = filters; } + /** + * There are three steps here to build BulkFormatMapping: + * + *

    1. Calculate the readDataFields, which is what we intend to read from the data schema. + * Meanwhile, generate the indexCastMapping, which is used to map the index of the + * readDataFields to the index of the data schema. + * + *

2. Calculate the mapping to trim _KEY_ fields. For example: we want _KEY_a, _KEY_b, + * _FIELD_SEQUENCE, _ROW_KIND, a, b, c, d, e, f, g from the data, but we don't actually need + * to read _KEY_a and a, or _KEY_b and b, at the same time, so we need to trim them. So we map + * them: read before: _KEY_a, _KEY_b, _FIELD_SEQUENCE, _ROW_KIND, a, b, c, d, e, f, g; read + * after: a, b, _FIELD_SEQUENCE, _ROW_KIND, c, d, e, f, g; and the mapping is + * [0,1,2,3,0,1,4,5,6,7,8], which converts the [read after] columns to [read before] columns. + * + *

    3. We want read much fewer fields than readDataFields, so we kick out the partition + * fields. We generate the partitionMappingAndFieldsWithoutPartitionPair which helps reduce + * the real read fields and tell us how to map it back. + */ public BulkFormatMapping build( String formatIdentifier, TableSchema tableSchema, TableSchema dataSchema) { - List readDataFields = readDataFields(dataSchema); - + // extract the whole data fields in logic. + List allDataFields = fieldsExtractor.apply(dataSchema); + List readDataFields = readDataFields(allDataFields); // build index cast mapping IndexCastMapping indexCastMapping = SchemaEvolutionUtil.createIndexCastMapping(readTableFields, readDataFields); + // map from key fields reading to value fields reading + Pair trimmedKeyPair = trimKeyFields(readDataFields, allDataFields); + // build partition mapping and filter partition fields Pair, List> partitionMappingAndFieldsWithoutPartitionPair = - PartitionUtils.constructPartitionMapping(dataSchema, readDataFields); + PartitionUtils.constructPartitionMapping( + dataSchema, trimmedKeyPair.getRight().getFields()); Pair partitionMapping = partitionMappingAndFieldsWithoutPartitionPair.getLeft(); - // build read row type - RowType readDataRowType = + RowType readRowType = new RowType(partitionMappingAndFieldsWithoutPartitionPair.getRight()); // build read filters @@ -138,18 +190,55 @@ public BulkFormatMapping build( return new BulkFormatMapping( indexCastMapping.getIndexMapping(), indexCastMapping.getCastMapping(), + trimmedKeyPair.getLeft(), partitionMapping, formatDiscover .discover(formatIdentifier) - .createReaderFactory(readDataRowType, readFilters), + .createReaderFactory(readRowType, readFilters), dataSchema, readFilters); } - private List readDataFields(TableSchema dataSchema) { - List dataFields = fieldsExtractor.apply(dataSchema); + static Pair trimKeyFields( + List fieldsWithoutPartition, List fields) { + int[] map = new int[fieldsWithoutPartition.size()]; + List trimmedFields = new ArrayList<>(); + Map fieldMap = new HashMap<>(); + Map positionMap = new HashMap<>(); + + for (DataField field : fields) { + fieldMap.put(field.id(), field); + } + + for (int i = 0; i < fieldsWithoutPartition.size(); i++) { + DataField field = fieldsWithoutPartition.get(i); + boolean keyField = SpecialFields.isKeyField(field.name()); + int id = keyField ? field.id() - KEY_FIELD_ID_START : field.id(); + // field in data schema + DataField f = fieldMap.get(id); + + if (f != null) { + if (positionMap.containsKey(id)) { + map[i] = positionMap.get(id); + } else { + map[i] = positionMap.computeIfAbsent(id, k -> trimmedFields.size()); + // If the target field is not key field, we remain what it is, because it + // may be projected. Example: the target field is a row type, but only read + // the few fields in it. If we simply trimmedFields.add(f), we will read + // more fields than we need. + trimmedFields.add(keyField ? 
f : field); + } + } else { + throw new RuntimeException("Can't find field with id: " + id + " in fields."); + } + } + + return Pair.of(map, new RowType(trimmedFields)); + } + + private List readDataFields(List allDataFields) { List readDataFields = new ArrayList<>(); - for (DataField dataField : dataFields) { + for (DataField dataField : allDataFields) { readTableFields.stream() .filter(f -> f.id() == dataField.id()) .findFirst() diff --git a/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileMetaTest.java b/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileMetaTest.java index 9384eb88824d1..1be5993fb0d08 100644 --- a/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileMetaTest.java +++ b/paimon-core/src/test/java/org/apache/paimon/manifest/ManifestFileMetaTest.java @@ -452,7 +452,7 @@ public void testIdentifierAfterFullCompaction() throws Exception { containSameIdentifyEntryFile(fullCompacted, entryIdentifierExpected); } - @RepeatedTest(1000) + @RepeatedTest(10) public void testRandomFullCompaction() throws Exception { List input = new ArrayList<>(); Set manifestEntrySet = new HashSet<>(); diff --git a/paimon-core/src/test/java/org/apache/paimon/utils/BulkFormatMappingTest.java b/paimon-core/src/test/java/org/apache/paimon/utils/BulkFormatMappingTest.java new file mode 100644 index 0000000000000..4d5d6e32e85dc --- /dev/null +++ b/paimon-core/src/test/java/org/apache/paimon/utils/BulkFormatMappingTest.java @@ -0,0 +1,147 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.paimon.utils; + +import org.apache.paimon.schema.IndexCastMapping; +import org.apache.paimon.schema.SchemaEvolutionUtil; +import org.apache.paimon.table.SpecialFields; +import org.apache.paimon.types.DataField; +import org.apache.paimon.types.DataTypes; +import org.apache.paimon.types.RowType; + +import org.assertj.core.api.Assertions; +import org.junit.jupiter.api.Test; + +import java.util.ArrayList; +import java.util.List; + +/** Test for {@link BulkFormatMapping.BulkFormatMappingBuilder}. 
*/ +public class BulkFormatMappingTest { + + @Test + public void testTrimKeyFields() { + List keyFields = new ArrayList<>(); + List allFields = new ArrayList<>(); + List testFields = new ArrayList<>(); + + for (int i = 0; i < 10; i++) { + keyFields.add( + new DataField( + SpecialFields.KEY_FIELD_ID_START + i, + SpecialFields.KEY_FIELD_PREFIX + i, + DataTypes.STRING())); + } + + allFields.addAll(keyFields); + for (int i = 0; i < 20; i++) { + allFields.add(new DataField(i, String.valueOf(i), DataTypes.STRING())); + } + + testFields.add( + new DataField( + SpecialFields.KEY_FIELD_ID_START + 1, + SpecialFields.KEY_FIELD_PREFIX + 1, + DataTypes.STRING())); + testFields.add( + new DataField( + SpecialFields.KEY_FIELD_ID_START + 3, + SpecialFields.KEY_FIELD_PREFIX + 3, + DataTypes.STRING())); + testFields.add( + new DataField( + SpecialFields.KEY_FIELD_ID_START + 5, + SpecialFields.KEY_FIELD_PREFIX + 5, + DataTypes.STRING())); + testFields.add( + new DataField( + SpecialFields.KEY_FIELD_ID_START + 7, + SpecialFields.KEY_FIELD_PREFIX + 7, + DataTypes.STRING())); + testFields.add(new DataField(3, String.valueOf(3), DataTypes.STRING())); + testFields.add(new DataField(4, String.valueOf(4), DataTypes.STRING())); + testFields.add(new DataField(5, String.valueOf(5), DataTypes.STRING())); + testFields.add(new DataField(1, String.valueOf(1), DataTypes.STRING())); + testFields.add(new DataField(6, String.valueOf(6), DataTypes.STRING())); + + Pair res = + BulkFormatMapping.BulkFormatMappingBuilder.trimKeyFields(testFields, allFields); + + Assertions.assertThat(res.getKey()).containsExactly(0, 1, 2, 3, 1, 4, 2, 0, 5); + + List fields = res.getRight().getFields(); + Assertions.assertThat(fields.size()).isEqualTo(6); + Assertions.assertThat(fields.get(0).id()).isEqualTo(1); + Assertions.assertThat(fields.get(1).id()).isEqualTo(3); + Assertions.assertThat(fields.get(2).id()).isEqualTo(5); + Assertions.assertThat(fields.get(3).id()).isEqualTo(7); + Assertions.assertThat(fields.get(4).id()).isEqualTo(4); + Assertions.assertThat(fields.get(5).id()).isEqualTo(6); + } + + @Test + public void testTrimKeyWithIndexMapping() { + List readTableFields = new ArrayList<>(); + List readDataFields = new ArrayList<>(); + + readTableFields.add( + new DataField( + SpecialFields.KEY_FIELD_ID_START + 1, + SpecialFields.KEY_FIELD_PREFIX + "a", + DataTypes.STRING())); + readTableFields.add(new DataField(0, "0", DataTypes.STRING())); + readTableFields.add(new DataField(1, "a", DataTypes.STRING())); + readTableFields.add(new DataField(2, "2", DataTypes.STRING())); + readTableFields.add(new DataField(3, "3", DataTypes.STRING())); + + readDataFields.add( + new DataField( + SpecialFields.KEY_FIELD_ID_START + 1, + SpecialFields.KEY_FIELD_PREFIX + "a", + DataTypes.STRING())); + readDataFields.add(new DataField(0, "0", DataTypes.STRING())); + readDataFields.add(new DataField(1, "a", DataTypes.STRING())); + readDataFields.add(new DataField(3, "3", DataTypes.STRING())); + + // build index cast mapping + IndexCastMapping indexCastMapping = + SchemaEvolutionUtil.createIndexCastMapping(readTableFields, readDataFields); + + // map from key fields reading to value fields reading + Pair trimmedKeyPair = + BulkFormatMapping.BulkFormatMappingBuilder.trimKeyFields( + readDataFields, readDataFields); + + BulkFormatMapping bulkFormatMapping = + new BulkFormatMapping( + indexCastMapping.getIndexMapping(), + indexCastMapping.getCastMapping(), + trimmedKeyPair.getLeft(), + null, + null, + null, + null); + + 
Assertions.assertThat(bulkFormatMapping.getIndexMapping()).containsExactly(0, 1, 0, -1, 2); + List trimmed = trimmedKeyPair.getRight().getFields(); + Assertions.assertThat(trimmed.get(0).id()).isEqualTo(1); + Assertions.assertThat(trimmed.get(1).id()).isEqualTo(0); + Assertions.assertThat(trimmed.get(2).id()).isEqualTo(3); + Assertions.assertThat(trimmed.size()).isEqualTo(3); + } +} diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/TestChangelogDataReadWrite.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/TestChangelogDataReadWrite.java index 17e63700faac7..d2bb9eb982741 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/TestChangelogDataReadWrite.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/source/TestChangelogDataReadWrite.java @@ -69,7 +69,7 @@ public class TestChangelogDataReadWrite { private static final RowType KEY_TYPE = new RowType(singletonList(new DataField(0, "k", new BigIntType()))); private static final RowType VALUE_TYPE = - new RowType(singletonList(new DataField(0, "v", new BigIntType()))); + new RowType(singletonList(new DataField(1, "v", new BigIntType()))); private static final RowType PARTITION_TYPE = new RowType(singletonList(new DataField(0, "p", new IntType()))); private static final Comparator COMPARATOR = @@ -87,7 +87,7 @@ public List keyFields(TableSchema schema) { @Override public List valueFields(TableSchema schema) { return Collections.singletonList( - new DataField(0, "v", new org.apache.paimon.types.BigIntType(false))); + new DataField(1, "v", new org.apache.paimon.types.BigIntType(false))); } }; From c6387a669d6cd0611c352dbfe4d241fea6a6484c Mon Sep 17 00:00:00 2001 From: Zouxxyy Date: Tue, 10 Dec 2024 14:41:37 +0800 Subject: [PATCH 131/157] [hive][spark] Support creating external table without schema when the table already exists (#4638) --- docs/content/spark/sql-ddl.md | 29 ++++++- docs/content/spark/sql-write.md | 31 +++++--- .../apache/paimon/schema/SchemaManager.java | 54 +++++++++---- .../org/apache/paimon/hive/HiveCatalog.java | 10 +-- .../org/apache/paimon/spark/SparkCatalog.java | 30 ++------ .../org/apache/paimon/spark/SparkSource.scala | 2 +- .../apache/paimon/spark/sql/DDLTestBase.scala | 2 +- .../sql/DDLWithHiveCatalogTestBase.scala | 75 ++++++++++++++----- 8 files changed, 157 insertions(+), 76 deletions(-) diff --git a/docs/content/spark/sql-ddl.md b/docs/content/spark/sql-ddl.md index 638a21a7042aa..cfe105f6ac006 100644 --- a/docs/content/spark/sql-ddl.md +++ b/docs/content/spark/sql-ddl.md @@ -156,6 +156,33 @@ CREATE TABLE my_table ( ); ``` +### Create External Table + +When the catalog's `metastore` type is `hive`, if the `location` is specified when creating a table, that table will be considered an external table; otherwise, it will be a managed table. + +When you drop an external table, only the metadata in Hive will be removed, and the actual data files will not be deleted; whereas dropping a managed table will also delete the data. + +```sql +CREATE TABLE my_table ( + user_id BIGINT, + item_id BIGINT, + behavior STRING, + dt STRING, + hh STRING +) PARTITIONED BY (dt, hh) TBLPROPERTIES ( + 'primary-key' = 'dt,hh,user_id' +) LOCATION '/path/to/table'; +``` + +Furthermore, if there is already data stored in the specified location, you can create the table without explicitly specifying the fields, partitions and props or other information. 
+In this case, the new table will inherit them all from the existing table’s metadata. + +However, if you manually specify them, you need to ensure that they are consistent with those of the existing table (props can be a subset). Therefore, it is strongly recommended not to specify them. + +```sql +CREATE TABLE my_table LOCATION '/path/to/table'; +``` + ### Create Table As Select Table can be created and populated by the results of a query, for example, we have a sql like this: `CREATE TABLE table_b AS SELECT id, name FORM table_a`, @@ -241,7 +268,7 @@ DROP VIEW v1; ``` ## Tag -### Create or Replace Tag +### Create Or Replace Tag Create or replace a tag syntax with the following options. - Create a tag with or without the snapshot id and time retention. - Create an existed tag is not failed if using `IF NOT EXISTS` syntax. diff --git a/docs/content/spark/sql-write.md b/docs/content/spark/sql-write.md index 5f4fa2dabc9f6..c3afcd3754c80 100644 --- a/docs/content/spark/sql-write.md +++ b/docs/content/spark/sql-write.md @@ -120,7 +120,17 @@ TRUNCATE TABLE my_table; ## Update Table -spark supports update PrimitiveType and StructType, for example: +Updates the column values for the rows that match a predicate. When no predicate is provided, update the column values for all rows. + +Note: + +{{< hint info >}} + +Update primary key columns is not supported when the target table is a primary key table. + +{{< /hint >}} + +Spark supports update PrimitiveType and StructType, for example: ```sql -- Syntax @@ -142,17 +152,22 @@ UPDATE t SET s.c2 = 'a_new' WHERE s.c1 = 1; ## Delete From Table +Deletes the rows that match a predicate. When no predicate is provided, deletes all rows. + ```sql DELETE FROM my_table WHERE currency = 'UNKNOWN'; ``` ## Merge Into Table -Paimon currently supports Merge Into syntax in Spark 3+, which allow a set of updates, insertions and deletions based on a source table in a single commit. +Merges a set of updates, insertions and deletions based on a source table into a target table. + +Note: + +{{< hint info >}} + +In update clause, to update primary key columns is not supported when the target table is a primary key table. -{{< hint into >}} -1. In update clause, to update primary key columns is not supported. -2. `WHEN NOT MATCHED BY SOURCE` syntax is not supported. {{< /hint >}} **Example: One** @@ -160,7 +175,6 @@ Paimon currently supports Merge Into syntax in Spark 3+, which allow a set of up This is a simple demo that, if a row exists in the target table update it, else insert it. ```sql - -- Here both source and target tables have the same schema: (a INT, b INT, c STRING), and a is a primary key. MERGE INTO target @@ -170,7 +184,6 @@ WHEN MATCHED THEN UPDATE SET * WHEN NOT MATCHED THEN INSERT * - ``` **Example: Two** @@ -178,7 +191,6 @@ THEN INSERT * This is a demo with multiple, conditional clauses. ```sql - -- Here both source and target tables have the same schema: (a INT, b INT, c STRING), and a is a primary key. MERGE INTO target @@ -194,15 +206,12 @@ WHEN NOT MATCHED AND c > 'c9' THEN INSERT (a, b, c) VALUES (a, b * 1.1, c) -- when not matched but meet the condition 3, then transform and insert this row; WHEN NOT MATCHED THEN INSERT * -- when not matched, insert this row without any transformation; - ``` ## Streaming Write {{< hint info >}} -Paimon currently supports Spark 3+ for streaming write. - Paimon Structured Streaming only supports the two `append` and `complete` modes. 
{{< /hint >}} diff --git a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java index 83ddbccfef987..2139dca4a9907 100644 --- a/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java +++ b/paimon-core/src/main/java/org/apache/paimon/schema/SchemaManager.java @@ -208,24 +208,18 @@ public TableSchema createTable(Schema schema) throws Exception { return createTable(schema, false); } - public TableSchema createTable(Schema schema, boolean ignoreIfExistsSame) throws Exception { + public TableSchema createTable(Schema schema, boolean externalTable) throws Exception { while (true) { Optional latest = latest(); if (latest.isPresent()) { - TableSchema oldSchema = latest.get(); - boolean isSame = - Objects.equals(oldSchema.fields(), schema.fields()) - && Objects.equals(oldSchema.partitionKeys(), schema.partitionKeys()) - && Objects.equals(oldSchema.primaryKeys(), schema.primaryKeys()) - && Objects.equals(oldSchema.options(), schema.options()); - if (ignoreIfExistsSame && isSame) { - return oldSchema; + TableSchema latestSchema = latest.get(); + if (externalTable) { + checkSchemaForExternalTable(latestSchema, schema); + return latestSchema; + } else { + throw new IllegalStateException( + "Schema in filesystem exists, creation is not allowed."); } - - throw new IllegalStateException( - "Schema in filesystem exists, please use updating," - + " latest schema is: " - + oldSchema); } List fields = schema.fields(); @@ -254,6 +248,38 @@ public TableSchema createTable(Schema schema, boolean ignoreIfExistsSame) throws } } + private void checkSchemaForExternalTable(TableSchema existsSchema, Schema newSchema) { + // When creating an external table, if the table already exists in the location, we can + // choose not to specify the fields. + if (newSchema.fields().isEmpty() + // When the fields are explicitly specified, we need check for consistency. + || (Objects.equals(existsSchema.fields(), newSchema.fields()) + && Objects.equals(existsSchema.partitionKeys(), newSchema.partitionKeys()) + && Objects.equals(existsSchema.primaryKeys(), newSchema.primaryKeys()))) { + // check for options + Map existsOptions = existsSchema.options(); + Map newOptions = newSchema.options(); + newOptions.forEach( + (key, value) -> { + if (!key.equals(Catalog.OWNER_PROP) + && (!existsOptions.containsKey(key) + || !existsOptions.get(key).equals(value))) { + throw new RuntimeException( + "New schema's options are not equal to the exists schema's, new schema: " + + newOptions + + ", exists schema: " + + existsOptions); + } + }); + } else { + throw new RuntimeException( + "New schema is not equal to exists schema, new schema: " + + newSchema + + ", exists schema: " + + existsSchema); + } + } + /** Update {@link SchemaChange}s. */ public TableSchema commitChanges(SchemaChange... 
changes) throws Exception { return commitChanges(Arrays.asList(changes)); diff --git a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java index 151e2b4d2c076..c74ede9815465 100644 --- a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java +++ b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveCatalog.java @@ -720,11 +720,7 @@ protected void createTableImpl(Identifier identifier, Schema schema) { try { tableSchema = schemaManager(identifier, location).createTable(schema, externalTable); } catch (Exception e) { - throw new RuntimeException( - "Failed to commit changes of table " - + identifier.getFullName() - + " to underlying files.", - e); + throw new RuntimeException("Failed to create table " + identifier.getFullName(), e); } try { @@ -735,7 +731,9 @@ protected void createTableImpl(Identifier identifier, Schema schema) { identifier, tableSchema, location, externalTable))); } catch (Exception e) { try { - fileIO.deleteDirectoryQuietly(location); + if (!externalTable) { + fileIO.deleteDirectoryQuietly(location); + } } catch (Exception ee) { LOG.error("Delete directory[{}] fail for table {}", location, identifier, ee); } diff --git a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java index 5ad1b13b7c7b6..d6318c723fe0e 100644 --- a/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java +++ b/paimon-spark/paimon-spark-common/src/main/java/org/apache/paimon/spark/SparkCatalog.java @@ -75,7 +75,6 @@ import static org.apache.paimon.spark.util.OptionUtils.copyWithSQLConf; import static org.apache.paimon.spark.utils.CatalogUtils.checkNamespace; import static org.apache.paimon.spark.utils.CatalogUtils.toIdentifier; -import static org.apache.paimon.utils.Preconditions.checkArgument; /** Spark {@link TableCatalog} for paimon. 
*/ public class SparkCatalog extends SparkBaseCatalog implements SupportFunction, SupportView { @@ -298,26 +297,8 @@ public org.apache.spark.sql.connector.catalog.Table createTable( Map properties) throws TableAlreadyExistsException, NoSuchNamespaceException { try { - String provider = properties.get(TableCatalog.PROP_PROVIDER); - if ((!usePaimon(provider)) - && SparkSource.FORMAT_NAMES().contains(provider.toLowerCase())) { - Map newProperties = new HashMap<>(properties); - newProperties.put(TYPE.key(), FORMAT_TABLE.toString()); - newProperties.put(FILE_FORMAT.key(), provider.toLowerCase()); - catalog.createTable( - toIdentifier(ident), - toInitialSchema(schema, partitions, newProperties), - false); - } else { - checkArgument( - usePaimon(provider), - "SparkCatalog can only create paimon table, but current provider is %s", - provider); - catalog.createTable( - toIdentifier(ident), - toInitialSchema(schema, partitions, properties), - false); - } + catalog.createTable( + toIdentifier(ident), toInitialSchema(schema, partitions, properties), false); return loadTable(ident); } catch (Catalog.TableAlreadyExistException e) { throw new TableAlreadyExistsException(ident); @@ -406,9 +387,12 @@ private static SchemaChange.Move getMove( private Schema toInitialSchema( StructType schema, Transform[] partitions, Map properties) { Map normalizedProperties = new HashMap<>(properties); - if (!normalizedProperties.containsKey(TableCatalog.PROP_PROVIDER)) { - normalizedProperties.put(TableCatalog.PROP_PROVIDER, SparkSource.NAME()); + String provider = properties.get(TableCatalog.PROP_PROVIDER); + if (!usePaimon(provider) && SparkSource.FORMAT_NAMES().contains(provider.toLowerCase())) { + normalizedProperties.put(TYPE.key(), FORMAT_TABLE.toString()); + normalizedProperties.put(FILE_FORMAT.key(), provider.toLowerCase()); } + normalizedProperties.remove(TableCatalog.PROP_PROVIDER); normalizedProperties.remove(PRIMARY_KEY_IDENTIFIER); normalizedProperties.remove(TableCatalog.PROP_COMMENT); if (normalizedProperties.containsKey(TableCatalog.PROP_LOCATION)) { diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/SparkSource.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/SparkSource.scala index 0170a29f68d36..d80d7350a6554 100644 --- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/SparkSource.scala +++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/SparkSource.scala @@ -118,7 +118,7 @@ object SparkSource { val NAME = "paimon" - val FORMAT_NAMES = Seq("csv", "orc", "parquet") + val FORMAT_NAMES: Seq[String] = Seq("csv", "orc", "parquet") def toBaseRelation(table: FileStoreTable, _sqlContext: SQLContext): BaseRelation = { new BaseRelation { diff --git a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala index 6ad5274496a90..3ed2c98306fb3 100644 --- a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLTestBase.scala @@ -161,7 +161,7 @@ abstract class DDLTestBase extends PaimonSparkTestBase { test("Paimon DDL: create table without using paimon") { withTable("paimon_tbl") { sql("CREATE TABLE paimon_tbl (id int)") - assert(loadTable("paimon_tbl").options().get("provider").equals("paimon")) + assert(!loadTable("paimon_tbl").options().containsKey("provider")) } } 
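For readers skimming this patch, the external-table consistency rule introduced above (an empty column list inherits the existing schema at the location; explicitly specified columns must match it exactly; supplied table properties must be a subset of the existing ones) can be summarized with a small standalone sketch. The class and method names below are invented for illustration, and the partition-key/primary-key comparison is omitted for brevity; this is not the actual `SchemaManager` code.

```java
import java.util.List;
import java.util.Map;
import java.util.Objects;

/** Illustrative sketch only; names are made up for this example. */
public class ExternalTableCheckSketch {

    /** Throws if the new definition conflicts with the schema already stored at the location. */
    static void check(
            List<String> existingFields,
            Map<String, String> existingOptions,
            List<String> newFields,
            Map<String, String> newOptions) {
        // 1. No fields specified: inherit everything from the existing table.
        // 2. Fields specified: they must match the existing schema exactly.
        if (!newFields.isEmpty() && !Objects.equals(existingFields, newFields)) {
            throw new RuntimeException("New schema is not equal to existing schema: " + newFields);
        }
        // 3. Specified properties must be a subset of the existing ones (same keys, same values).
        newOptions.forEach(
                (k, v) -> {
                    if (!v.equals(existingOptions.get(k))) {
                        throw new RuntimeException("Conflicting table property: " + k);
                    }
                });
    }

    public static void main(String[] args) {
        List<String> fields = List.of("id INT", "pt INT");
        Map<String, String> options = Map.of("k1", "v1");

        check(fields, options, List.of(), Map.of()); // OK: inherit everything
        check(fields, options, fields, Map.of("k1", "v1")); // OK: exact match, option subset
        try {
            check(fields, options, List.of(), Map.of("k2", "v2")); // rejected: unknown property
        } catch (RuntimeException e) {
            System.out.println("rejected as expected: " + e.getMessage());
        }
    }
}
```

The real check in `SchemaManager#checkSchemaForExternalTable` additionally skips the internal owner property and also compares partition keys and primary keys, as shown in the diff above.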
diff --git a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala index e99e4434ef7f1..1189f1f2906b3 100644 --- a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala +++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/DDLWithHiveCatalogTestBase.scala @@ -326,13 +326,7 @@ abstract class DDLWithHiveCatalogTestBase extends PaimonHiveTestBase { spark.sql( s"CREATE TABLE external_tbl (id INT) USING paimon LOCATION '$expertTbLocation'") checkAnswer(spark.sql("SELECT * FROM external_tbl"), Row(1)) - assert( - loadTable("paimon_db", "external_tbl") - .location() - .toString - .split(':') - .apply(1) - .equals(expertTbLocation)) + assert(getActualTableLocation("paimon_db", "external_tbl").equals(expertTbLocation)) // create managed table spark.sql(s"CREATE TABLE managed_tbl (id INT) USING paimon") @@ -373,12 +367,8 @@ abstract class DDLWithHiveCatalogTestBase extends PaimonHiveTestBase { spark.sql("ALTER TABLE external_tbl RENAME TO external_tbl_renamed") checkAnswer(spark.sql("SELECT * FROM external_tbl_renamed"), Row(1)) assert( - loadTable("paimon_db", "external_tbl_renamed") - .location() - .toString - .split(':') - .apply(1) - .equals(expertTbLocation)) + getActualTableLocation("paimon_db", "external_tbl_renamed").equals( + expertTbLocation)) // create managed table spark.sql(s"CREATE TABLE managed_tbl (id INT) USING paimon") @@ -389,12 +379,55 @@ abstract class DDLWithHiveCatalogTestBase extends PaimonHiveTestBase { spark.sql("ALTER TABLE managed_tbl RENAME TO managed_tbl_renamed") checkAnswer(spark.sql("SELECT * FROM managed_tbl_renamed"), Row(1)) assert( - !loadTable("paimon_db", "managed_tbl_renamed") - .location() - .toString - .split(':') - .apply(1) - .equals(managedTbLocation.toString)) + !getActualTableLocation("paimon_db", "managed_tbl_renamed").equals( + managedTbLocation.toString)) + } + } + } + } + } + + test("Paimon DDL with hive catalog: create external table without schema") { + Seq(sparkCatalogName, paimonHiveCatalogName).foreach { + catalogName => + spark.sql(s"USE $catalogName") + withTempDir { + tbLocation => + withDatabase("paimon_db") { + spark.sql(s"CREATE DATABASE IF NOT EXISTS paimon_db") + spark.sql(s"USE paimon_db") + withTable("t1", "t2", "t3", "t4", "t5") { + val expertTbLocation = tbLocation.getCanonicalPath + spark.sql(s""" + |CREATE TABLE t1 (id INT, pt INT) USING paimon + |PARTITIONED BY (pt) + |TBLPROPERTIES('primary-key' = 'id', 'k1' = 'v1') + |LOCATION '$expertTbLocation' + |""".stripMargin) + spark.sql("INSERT INTO t1 VALUES (1, 1)") + + // create table without schema + spark.sql(s"CREATE TABLE t2 USING paimon LOCATION '$expertTbLocation'") + checkAnswer(spark.sql("SELECT * FROM t2"), Row(1, 1)) + assert(getActualTableLocation("paimon_db", "t2").equals(expertTbLocation)) + + // create table with wrong schema + intercept[Exception] { + spark.sql( + s"CREATE TABLE t3 (fake_col INT) USING paimon LOCATION '$expertTbLocation'") + } + + // create table with exists props + spark.sql( + s"CREATE TABLE t4 USING paimon TBLPROPERTIES ('k1' = 'v1') LOCATION '$expertTbLocation'") + checkAnswer(spark.sql("SELECT * FROM t4"), Row(1, 1)) + assert(getActualTableLocation("paimon_db", "t4").equals(expertTbLocation)) + + // create table with new props + intercept[Exception] { + spark.sql( + s"CREATE TABLE t5 USING paimon TBLPROPERTIES ('k2' = 
'v2') LOCATION '$expertTbLocation'") + } } } } @@ -445,4 +478,8 @@ abstract class DDLWithHiveCatalogTestBase extends PaimonHiveTestBase { .toMap tableProps("path").split(":")(1) } + + def getActualTableLocation(dbName: String, tblName: String): String = { + loadTable(dbName, tblName).location().toString.split(':').apply(1) + } } From f8c33c5d72cbe16977ca842f41bfb8a3e32285f7 Mon Sep 17 00:00:00 2001 From: yuzelin <33053040+yuzelin@users.noreply.github.com> Date: Tue, 10 Dec 2024 15:01:43 +0800 Subject: [PATCH 132/157] [hotfix] Fix flaky test of orc tests in ArrowBatchConverterTest (#4673) --- .../paimon/arrow/converter/ArrowBatchConverterTest.java | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/paimon-arrow/src/test/java/org/apache/paimon/arrow/converter/ArrowBatchConverterTest.java b/paimon-arrow/src/test/java/org/apache/paimon/arrow/converter/ArrowBatchConverterTest.java index c726283f0044b..aef589d912423 100644 --- a/paimon-arrow/src/test/java/org/apache/paimon/arrow/converter/ArrowBatchConverterTest.java +++ b/paimon-arrow/src/test/java/org/apache/paimon/arrow/converter/ArrowBatchConverterTest.java @@ -910,8 +910,9 @@ private boolean isVectorizedWithDv(RecordReader.RecordIterator iter private Object[] randomRowValues(boolean[] nullable) { Object[] values = new Object[18]; - values[0] = BinaryString.fromString(StringUtils.getRandomString(RND, 10, 10)); - values[1] = BinaryString.fromString(StringUtils.getRandomString(RND, 1, 20)); + // The orc char reader will trim the string. See TreeReaderFactory.CharTreeReader + values[0] = BinaryString.fromString(StringUtils.getRandomString(RND, 9, 9) + "A"); + values[1] = BinaryString.fromString(StringUtils.getRandomString(RND, 1, 19) + "A"); values[2] = RND.nextBoolean(); values[3] = randomBytes(10, 10); values[4] = randomBytes(1, 20); From 7400979e0a3988fc72298c1bbcf762921c307e78 Mon Sep 17 00:00:00 2001 From: Jingsong Date: Tue, 10 Dec 2024 16:00:42 +0800 Subject: [PATCH 133/157] [orc] Row group filter push down cannot work with bitmap index --- .../apache/paimon/format/FormatReaderContext.java | 1 + .../apache/paimon/format/FormatReaderFactory.java | 3 +++ .../java/org/apache/orc/impl/RecordReaderImpl.java | 4 +++- .../apache/paimon/format/orc/OrcReaderFactory.java | 13 ++++++++----- 4 files changed, 15 insertions(+), 6 deletions(-) diff --git a/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderContext.java b/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderContext.java index 0d3dd7c79ff31..cae6a977e6152 100644 --- a/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderContext.java +++ b/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderContext.java @@ -60,6 +60,7 @@ public long fileSize() { return fileSize; } + @Nullable @Override public FileIndexResult fileIndex() { return fileIndexResult; diff --git a/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderFactory.java b/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderFactory.java index d8af3e2fe37ca..5ef084ec4d344 100644 --- a/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderFactory.java +++ b/paimon-common/src/main/java/org/apache/paimon/format/FormatReaderFactory.java @@ -25,6 +25,8 @@ import org.apache.paimon.reader.FileRecordReader; import org.apache.paimon.reader.RecordReader; +import javax.annotation.Nullable; + import java.io.IOException; /** A factory to create {@link RecordReader} for file. 
*/ @@ -41,6 +43,7 @@ interface Context { long fileSize(); + @Nullable FileIndexResult fileIndex(); } } diff --git a/paimon-format/src/main/java/org/apache/orc/impl/RecordReaderImpl.java b/paimon-format/src/main/java/org/apache/orc/impl/RecordReaderImpl.java index 6c3af4e50043f..93aa0719caea5 100644 --- a/paimon-format/src/main/java/org/apache/orc/impl/RecordReaderImpl.java +++ b/paimon-format/src/main/java/org/apache/orc/impl/RecordReaderImpl.java @@ -62,6 +62,8 @@ import org.slf4j.Logger; import org.slf4j.LoggerFactory; +import javax.annotation.Nullable; + import java.io.IOException; import java.math.BigDecimal; import java.sql.Timestamp; @@ -127,7 +129,7 @@ public class RecordReaderImpl implements RecordReader { private final boolean noSelectedVector; // identifies whether the file has bad bloom filters that we should not use. private final boolean skipBloomFilters; - private final FileIndexResult fileIndexResult; + @Nullable private final FileIndexResult fileIndexResult; static final String[] BAD_CPP_BLOOM_FILTER_VERSIONS = { "1.6.0", "1.6.1", "1.6.2", "1.6.3", "1.6.4", "1.6.5", "1.6.6", "1.6.7", "1.6.8", "1.6.9", "1.6.10", "1.6.11", "1.7.0" diff --git a/paimon-format/src/main/java/org/apache/paimon/format/orc/OrcReaderFactory.java b/paimon-format/src/main/java/org/apache/paimon/format/orc/OrcReaderFactory.java index ee0f8a55c0346..db17357bfd705 100644 --- a/paimon-format/src/main/java/org/apache/paimon/format/orc/OrcReaderFactory.java +++ b/paimon-format/src/main/java/org/apache/paimon/format/orc/OrcReaderFactory.java @@ -24,6 +24,7 @@ import org.apache.paimon.data.columnar.ColumnarRowIterator; import org.apache.paimon.data.columnar.VectorizedColumnBatch; import org.apache.paimon.fileindex.FileIndexResult; +import org.apache.paimon.fileindex.bitmap.BitmapIndexResult; import org.apache.paimon.format.FormatReaderFactory; import org.apache.paimon.format.OrcFormatReaderContext; import org.apache.paimon.format.fs.HadoopReadOnlyFileSystem; @@ -258,7 +259,7 @@ private static RecordReader createRecordReader( org.apache.paimon.fs.Path path, long splitStart, long splitLength, - FileIndexResult fileIndexResult, + @Nullable FileIndexResult fileIndexResult, boolean deletionVectorsEnabled) throws IOException { org.apache.orc.Reader orcReader = createReader(conf, fileIO, path, fileIndexResult); @@ -276,9 +277,11 @@ private static RecordReader createRecordReader( .skipCorruptRecords(OrcConf.SKIP_CORRUPT_DATA.getBoolean(conf)) .tolerateMissingSchema( OrcConf.TOLERATE_MISSING_SCHEMA.getBoolean(conf)); - if (!conjunctPredicates.isEmpty() && !deletionVectorsEnabled) { - // deletion vectors can not enable this feature, cased by getRowNumber would be - // changed. 
+ if (!conjunctPredicates.isEmpty() + && !deletionVectorsEnabled + && !(fileIndexResult instanceof BitmapIndexResult)) { + // row group filter push down will make row number change incorrect + // so deletion vectors mode and bitmap index cannot work with row group push down options.useSelected(OrcConf.READER_USE_SELECTED.getBoolean(conf)); options.allowSARGToFilter(OrcConf.ALLOW_SARG_TO_FILTER.getBoolean(conf)); } @@ -342,7 +345,7 @@ public static org.apache.orc.Reader createReader( org.apache.hadoop.conf.Configuration conf, FileIO fileIO, org.apache.paimon.fs.Path path, - FileIndexResult fileIndexResult) + @Nullable FileIndexResult fileIndexResult) throws IOException { // open ORC file and create reader org.apache.hadoop.fs.Path hPath = new org.apache.hadoop.fs.Path(path.toUri()); From 84eadce2b95eec0c36fe13dde10958080cd80f28 Mon Sep 17 00:00:00 2001 From: Giannis Polyzos Date: Tue, 10 Dec 2024 10:12:30 +0200 Subject: [PATCH 134/157] [docs] add glue metastore repo for iceberg compability (#4674) --- docs/content/migration/iceberg-compatibility.md | 1 + 1 file changed, 1 insertion(+) diff --git a/docs/content/migration/iceberg-compatibility.md b/docs/content/migration/iceberg-compatibility.md index 54018b073f91f..b6fcaa2826155 100644 --- a/docs/content/migration/iceberg-compatibility.md +++ b/docs/content/migration/iceberg-compatibility.md @@ -397,6 +397,7 @@ you also need to set some (or all) of the following table options when creating You can use Hive Catalog to connect AWS Glue metastore, you can use set `'metadata.iceberg.hive-client-class'` to `'com.amazonaws.glue.catalog.metastore.AWSCatalogMetastoreClient'`. +> **Note:** You can use this [repo](https://github.com/promotedai/aws-glue-data-catalog-client-for-apache-hive-metastore) to build the required jar, include it in your path and configure the AWSCatalogMetastoreClient. ## AWS Athena AWS Athena may use old manifest reader to read Iceberg manifest by names, we should let Paimon producing legacy Iceberg From 90a37c8b81ed8c2ec38703909c3559ae83630466 Mon Sep 17 00:00:00 2001 From: Yujiang Zhong <42907416+zhongyujiang@users.noreply.github.com> Date: Tue, 10 Dec 2024 16:15:16 +0800 Subject: [PATCH 135/157] [core] Improve fault tolerance for data spill to disk. 
(#4675) --- .../paimon/disk/FileChannelManagerImpl.java | 22 ++++++++++++++----- 1 file changed, 16 insertions(+), 6 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/disk/FileChannelManagerImpl.java b/paimon-core/src/main/java/org/apache/paimon/disk/FileChannelManagerImpl.java index ce175e90bbd1e..99690d426fb52 100644 --- a/paimon-core/src/main/java/org/apache/paimon/disk/FileChannelManagerImpl.java +++ b/paimon-core/src/main/java/org/apache/paimon/disk/FileChannelManagerImpl.java @@ -29,7 +29,9 @@ import java.io.File; import java.io.IOException; import java.io.UncheckedIOException; +import java.util.ArrayList; import java.util.Arrays; +import java.util.List; import java.util.Random; import java.util.UUID; import java.util.concurrent.atomic.AtomicLong; @@ -63,24 +65,32 @@ public FileChannelManagerImpl(String[] tempDirs, String prefix) { } private static File[] createFiles(String[] tempDirs, String prefix) { - File[] files = new File[tempDirs.length]; + List filesList = new ArrayList<>(); for (int i = 0; i < tempDirs.length; i++) { File baseDir = new File(tempDirs[i]); String subfolder = String.format("paimon-%s-%s", prefix, UUID.randomUUID()); File storageDir = new File(baseDir, subfolder); if (!storageDir.exists() && !storageDir.mkdirs()) { - throw new RuntimeException( - "Could not create storage directory for FileChannelManager: " - + storageDir.getAbsolutePath()); + LOG.warn( + "Failed to create directory {}, temp directory {} will not be used", + storageDir.getAbsolutePath(), + tempDirs[i]); + continue; } - files[i] = storageDir; + + filesList.add(storageDir); LOG.debug( "FileChannelManager uses directory {} for spill files.", storageDir.getAbsolutePath()); } - return files; + + if (filesList.isEmpty()) { + throw new RuntimeException("No available temporary directories"); + } + + return filesList.toArray(new File[0]); } @Override From 2eeed7d00102e765721464795bf786b8d0b506c5 Mon Sep 17 00:00:00 2001 From: yangjf2019 <54518670+yangjf2019@users.noreply.github.com> Date: Tue, 10 Dec 2024 18:58:03 +0800 Subject: [PATCH 136/157] [doc] updated url links in documentation (#4679) --- docs/content/flink/sql-write.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/docs/content/flink/sql-write.md b/docs/content/flink/sql-write.md index 60c0f5c36c529..408c8e209e65f 100644 --- a/docs/content/flink/sql-write.md +++ b/docs/content/flink/sql-write.md @@ -176,8 +176,8 @@ PARTITION (k0 = 0, k1 = 0) SELECT v FROM my_table WHERE false; {{< hint info >}} Important table properties setting: 1. Only [primary key table]({{< ref "primary-key-table/overview" >}}) supports this feature. -2. [MergeEngine]({{< ref "primary-key-table/merge-engine" >}}) needs to be [deduplicate]({{< ref "primary-key-table/merge-engine#deduplicate" >}}) - or [partial-update]({{< ref "primary-key-table/merge-engine#partial-update" >}}) to support this feature. +2. [MergeEngine]({{< ref "primary-key-table/merge-engine" >}}) needs to be [deduplicate]({{< ref "primary-key-table/merge-engine/overview/#deduplicate" >}}) + or [partial-update]({{< ref "primary-key-table/merge-engine/partial-update/" >}}) to support this feature. 3. Do not support updating primary keys. {{< /hint >}} @@ -211,9 +211,9 @@ UPDATE my_table SET b = 1, c = 2 WHERE a = 'myTable'; {{< hint info >}} Important table properties setting: 1. Only primary key tables support this feature. -2. 
If the table has primary keys, the following [MergeEngine]({{< ref "primary-key-table/merge-engine" >}}) support this feature: - * [deduplicate]({{< ref "primary-key-table/merge-engine#deduplicate" >}}). - * [partial-update]({{< ref "primary-key-table/merge-engine#partial-update" >}}) with option 'partial-update.remove-record-on-delete' enabled. +2. If the table has primary keys, the following [MergeEngine]({{< ref "primary-key-table/merge-engine/overview/" >}}) support this feature: + * [deduplicate]({{< ref "primary-key-table/merge-engine/overview/#deduplicate" >}}). + * [partial-update]({{< ref "primary-key-table/merge-engine/partial-update/" >}}) with option 'partial-update.remove-record-on-delete' enabled. 3. Do not support deleting from table in streaming mode. {{< /hint >}} From 6010e615fdc99320b8dd6e9f52d70bfdc98174a5 Mon Sep 17 00:00:00 2001 From: yuzelin <33053040+yuzelin@users.noreply.github.com> Date: Tue, 10 Dec 2024 21:35:56 +0800 Subject: [PATCH 137/157] [hotfix] CloneAction throw more clear exception when no table in source catalog (#4682) --- .../flink/clone/CloneSourceBuilder.java | 3 ++ .../flink/action/CloneActionITCase.java | 43 +++++++++++++++++++ 2 files changed, 46 insertions(+) diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/clone/CloneSourceBuilder.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/clone/CloneSourceBuilder.java index a0f4ef33dee28..585c73cb952cc 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/clone/CloneSourceBuilder.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/clone/CloneSourceBuilder.java @@ -34,6 +34,7 @@ import java.util.Map; import static org.apache.paimon.utils.Preconditions.checkArgument; +import static org.apache.paimon.utils.Preconditions.checkState; /** * Pick the tables to be cloned based on the user input parameters. The record type of the build @@ -114,6 +115,8 @@ private DataStream> build(Catalog sourceCatalog) throws E database + "." + tableName, targetDatabase + "." + targetTableName)); } + checkState(!result.isEmpty(), "Didn't find any table in source catalog."); + if (LOG.isDebugEnabled()) { LOG.debug("The clone identifiers of source table and target table are: {}", result); } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CloneActionITCase.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CloneActionITCase.java index 71672551abcba..a55b01cc203be 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CloneActionITCase.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/action/CloneActionITCase.java @@ -32,6 +32,7 @@ import org.apache.flink.table.api.config.TableConfigOptions; import org.apache.flink.types.Row; import org.apache.flink.util.CloseableIterator; +import org.junit.jupiter.api.Test; import org.junit.jupiter.api.Timeout; import org.junit.jupiter.params.ParameterizedTest; import org.junit.jupiter.params.provider.ValueSource; @@ -44,8 +45,10 @@ import java.util.stream.Collectors; import java.util.stream.IntStream; +import static org.apache.paimon.testutils.assertj.PaimonAssertions.anyCauseMatches; import static org.apache.paimon.utils.Preconditions.checkState; import static org.assertj.core.api.Assertions.assertThat; +import static org.assertj.core.api.Assertions.assertThatThrownBy; /** IT cases for {@link CloneAction}. 
*/ public class CloneActionITCase extends ActionITCaseBase { @@ -640,6 +643,46 @@ public void testCloneTableWithExpiration(String invoker) throws Exception { .isEqualTo(Collections.singletonList("+I[1]")); } + // ------------------------------------------------------------------------ + // Negative Tests + // ------------------------------------------------------------------------ + + @Test + public void testEmptySourceCatalog() { + String sourceWarehouse = getTempDirPath("source-ware"); + + TableEnvironment tEnv = tableEnvironmentBuilder().batchMode().parallelism(1).build(); + tEnv.executeSql( + "CREATE CATALOG sourcecat WITH (\n" + + " 'type' = 'paimon',\n" + + String.format(" 'warehouse' = '%s'\n", sourceWarehouse) + + ")"); + + String targetWarehouse = getTempDirPath("target-ware"); + + String[] args = + new String[] { + "clone", + "--warehouse", + sourceWarehouse, + "--target_warehouse", + targetWarehouse, + "--parallelism", + "1" + }; + CloneAction action = (CloneAction) ActionFactory.createAction(args).get(); + + StreamExecutionEnvironment env = + streamExecutionEnvironmentBuilder().streamingMode().allowRestart().build(); + action.withStreamExecutionEnvironment(env); + + assertThatThrownBy(action::run) + .satisfies( + anyCauseMatches( + IllegalStateException.class, + "Didn't find any table in source catalog.")); + } + // ------------------------------------------------------------------------ // Utils // ------------------------------------------------------------------------ From 5cf4c93791c460cb35bdd53a5e0b512b964781a5 Mon Sep 17 00:00:00 2001 From: YeJunHao <41894543+leaves12138@users.noreply.github.com> Date: Wed, 11 Dec 2024 15:14:03 +0800 Subject: [PATCH 138/157] [core] Check file size after write bundle of records (#4685) --- .../java/org/apache/paimon/io/RollingFileWriter.java | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/io/RollingFileWriter.java b/paimon-core/src/main/java/org/apache/paimon/io/RollingFileWriter.java index 109b7574304ed..29b9223b9a372 100644 --- a/paimon-core/src/main/java/org/apache/paimon/io/RollingFileWriter.java +++ b/paimon-core/src/main/java/org/apache/paimon/io/RollingFileWriter.java @@ -64,10 +64,9 @@ public long targetFileSize() { return targetFileSize; } - @VisibleForTesting - boolean rollingFile() throws IOException { + private boolean rollingFile(boolean forceCheck) throws IOException { return currentWriter.reachTargetSize( - recordCount % CHECK_ROLLING_RECORD_CNT == 0, targetFileSize); + forceCheck || recordCount % CHECK_ROLLING_RECORD_CNT == 0, targetFileSize); } @Override @@ -81,7 +80,7 @@ public void write(T row) throws IOException { currentWriter.write(row); recordCount += 1; - if (rollingFile()) { + if (rollingFile(false)) { closeCurrentWriter(); } } catch (Throwable e) { @@ -105,7 +104,7 @@ public void writeBundle(BundleRecords bundle) throws IOException { currentWriter.writeBundle(bundle); recordCount += bundle.rowCount(); - if (rollingFile()) { + if (rollingFile(true)) { closeCurrentWriter(); } } catch (Throwable e) { From b339693d9a53d680c383cfdfd9075464f31b1261 Mon Sep 17 00:00:00 2001 From: Jingsong Date: Wed, 11 Dec 2024 16:29:03 +0800 Subject: [PATCH 139/157] [doc] Fix links in sql-write --- docs/content/flink/sql-write.md | 10 +++++----- .../content/primary-key-table/merge-engine/overview.md | 2 +- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/docs/content/flink/sql-write.md b/docs/content/flink/sql-write.md index 408c8e209e65f..6abbfa01756ce 
100644 --- a/docs/content/flink/sql-write.md +++ b/docs/content/flink/sql-write.md @@ -176,8 +176,8 @@ PARTITION (k0 = 0, k1 = 0) SELECT v FROM my_table WHERE false; {{< hint info >}} Important table properties setting: 1. Only [primary key table]({{< ref "primary-key-table/overview" >}}) supports this feature. -2. [MergeEngine]({{< ref "primary-key-table/merge-engine" >}}) needs to be [deduplicate]({{< ref "primary-key-table/merge-engine/overview/#deduplicate" >}}) - or [partial-update]({{< ref "primary-key-table/merge-engine/partial-update/" >}}) to support this feature. +2. [MergeEngine]({{< ref "primary-key-table/merge-engine" >}}) needs to be [deduplicate]({{< ref "primary-key-table/merge-engine/overview#deduplicate" >}}) + or [partial-update]({{< ref "primary-key-table/merge-engine/partial-update" >}}) to support this feature. 3. Do not support updating primary keys. {{< /hint >}} @@ -211,9 +211,9 @@ UPDATE my_table SET b = 1, c = 2 WHERE a = 'myTable'; {{< hint info >}} Important table properties setting: 1. Only primary key tables support this feature. -2. If the table has primary keys, the following [MergeEngine]({{< ref "primary-key-table/merge-engine/overview/" >}}) support this feature: - * [deduplicate]({{< ref "primary-key-table/merge-engine/overview/#deduplicate" >}}). - * [partial-update]({{< ref "primary-key-table/merge-engine/partial-update/" >}}) with option 'partial-update.remove-record-on-delete' enabled. +2. If the table has primary keys, the following [MergeEngine]({{< ref "primary-key-table/merge-engine/overview" >}}) support this feature: + * [deduplicate]({{< ref "primary-key-table/merge-engine/overview#deduplicate" >}}). + * [partial-update]({{< ref "primary-key-table/merge-engine/partial-update" >}}) with option 'partial-update.remove-record-on-delete' enabled. 3. Do not support deleting from table in streaming mode. 
{{< /hint >}} diff --git a/docs/content/primary-key-table/merge-engine/overview.md b/docs/content/primary-key-table/merge-engine/overview.md index 9f3b50c398bdc..4d192283aa688 100644 --- a/docs/content/primary-key-table/merge-engine/overview.md +++ b/docs/content/primary-key-table/merge-engine/overview.md @@ -3,7 +3,7 @@ title: "Overview" weight: 1 type: docs aliases: -- /primary-key-table/merge-engin/overview.html +- /primary-key-table/merge-engine/overview.html --- paimon-common/src/main/antlr4/** + paimon-core/src/test/resources/compatibility/** From 72e71503394dbf1269560cf373f5ea6186d134db Mon Sep 17 00:00:00 2001 From: WenjunMin Date: Sun, 15 Dec 2024 22:33:17 +0800 Subject: [PATCH 156/157] [core] Tolerate the NoSuchObjectException when report the partition statistic (#4708) --- .../paimon/metastore/MetastoreClient.java | 3 ++- .../flink/sink/partition/HmsReporter.java | 2 +- .../partition/AddDonePartitionActionTest.java | 3 ++- .../flink/sink/partition/HmsReporterTest.java | 3 ++- .../paimon/hive/HiveMetastoreClient.java | 27 +++++++++++++------ 5 files changed, 26 insertions(+), 12 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/metastore/MetastoreClient.java b/paimon-core/src/main/java/org/apache/paimon/metastore/MetastoreClient.java index 60e28c59f45dc..75f7af5abbdc1 100644 --- a/paimon-core/src/main/java/org/apache/paimon/metastore/MetastoreClient.java +++ b/paimon-core/src/main/java/org/apache/paimon/metastore/MetastoreClient.java @@ -55,7 +55,8 @@ default void addPartitionsSpec(List> partitionSpec default void alterPartition( LinkedHashMap partitionSpec, Map parameters, - long modifyTime) + long modifyTime, + boolean ignoreIfNotExist) throws Exception { throw new UnsupportedOperationException(); } diff --git a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/partition/HmsReporter.java b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/partition/HmsReporter.java index eb965aa3a3188..853dc52c20bfc 100644 --- a/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/partition/HmsReporter.java +++ b/paimon-flink/paimon-flink-common/src/main/java/org/apache/paimon/flink/sink/partition/HmsReporter.java @@ -93,7 +93,7 @@ public void report(String partition, long modifyTime) throws Exception { statistic.put(HIVE_LAST_UPDATE_TIME_PROP, String.valueOf(modifyTime / 1000)); LOG.info("alter partition {} with statistic {}.", partitionSpec, statistic); - metastoreClient.alterPartition(partitionSpec, statistic, modifyTime); + metastoreClient.alterPartition(partitionSpec, statistic, modifyTime, true); } } diff --git a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/partition/AddDonePartitionActionTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/partition/AddDonePartitionActionTest.java index 19c22d137c7f2..fca5dcf0ed69d 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/partition/AddDonePartitionActionTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/partition/AddDonePartitionActionTest.java @@ -66,7 +66,8 @@ public void markDone(LinkedHashMap partitionSpec) public void alterPartition( LinkedHashMap partitionSpec, Map parameters, - long modifyTime) + long modifyTime, + boolean ignoreIfNotExist) throws Exception { throw new UnsupportedOperationException(); } diff --git 
a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/partition/HmsReporterTest.java b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/partition/HmsReporterTest.java index 0050f3083a8ec..f245940da57d8 100644 --- a/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/partition/HmsReporterTest.java +++ b/paimon-flink/paimon-flink-common/src/test/java/org/apache/paimon/flink/sink/partition/HmsReporterTest.java @@ -117,7 +117,8 @@ public void markDone(LinkedHashMap partitionSpec) public void alterPartition( LinkedHashMap partitionSpec, Map parameters, - long modifyTime) + long modifyTime, + boolean ignoreIfNotExist) throws Exception { partitionParams.put( PartitionPathUtils.generatePartitionPath(partitionSpec), diff --git a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveMetastoreClient.java b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveMetastoreClient.java index 3793c86f82693..885fa463e5a7d 100644 --- a/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveMetastoreClient.java +++ b/paimon-hive/paimon-hive-catalog/src/main/java/org/apache/paimon/hive/HiveMetastoreClient.java @@ -119,17 +119,28 @@ public void addPartitionsSpec(List> partitionSpecs public void alterPartition( LinkedHashMap partitionSpec, Map parameters, - long modifyTime) + long modifyTime, + boolean ignoreIfNotExist) throws Exception { List partitionValues = new ArrayList<>(partitionSpec.values()); int currentTime = (int) (modifyTime / 1000); - Partition hivePartition = - clients.run( - client -> - client.getPartition( - identifier.getDatabaseName(), - identifier.getObjectName(), - partitionValues)); + Partition hivePartition; + try { + hivePartition = + clients.run( + client -> + client.getPartition( + identifier.getDatabaseName(), + identifier.getObjectName(), + partitionValues)); + } catch (NoSuchObjectException e) { + if (ignoreIfNotExist) { + return; + } else { + throw e; + } + } + hivePartition.setValues(partitionValues); hivePartition.setLastAccessTime(currentTime); hivePartition.getParameters().putAll(parameters); From 9179d654b61d933551baffe36cbcd675869f1ebc Mon Sep 17 00:00:00 2001 From: Zouxxyy Date: Sun, 15 Dec 2024 22:36:47 +0800 Subject: [PATCH 157/157] [core][spark] Enable limit pushdown and count optimization for dv table (#4709) --- .../apache/paimon/table/source/DataSplit.java | 40 +++++++++++ .../table/source/DataTableBatchScan.java | 19 +----- .../table/source/SplitGeneratorTest.java | 4 +- .../apache/paimon/table/source/SplitTest.java | 67 +++++++++++++++++++ .../paimon/spark/PaimonScanBuilder.scala | 12 ++-- .../spark/aggregate/LocalAggregator.scala | 22 +++--- .../paimon/spark/sql/PaimonPushDownTest.scala | 52 ++++++++++---- .../spark/sql/PushDownAggregatesTest.scala | 66 +++++++++++++----- 8 files changed, 216 insertions(+), 66 deletions(-) diff --git a/paimon-core/src/main/java/org/apache/paimon/table/source/DataSplit.java b/paimon-core/src/main/java/org/apache/paimon/table/source/DataSplit.java index 29405466b93f1..b9460f28b4e79 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/source/DataSplit.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/source/DataSplit.java @@ -44,6 +44,7 @@ import static org.apache.paimon.io.DataFilePathFactory.INDEX_PATH_SUFFIX; import static org.apache.paimon.utils.Preconditions.checkArgument; +import static org.apache.paimon.utils.Preconditions.checkState; /** Input splits. 
Needed by most batch computation engines. */ public class DataSplit implements Split { @@ -126,6 +127,45 @@ public long rowCount() { return rowCount; } + /** Whether it is possible to calculate the merged row count. */ + public boolean mergedRowCountAvailable() { + return rawConvertible + && (dataDeletionFiles == null + || dataDeletionFiles.stream() + .allMatch(f -> f == null || f.cardinality() != null)); + } + + public long mergedRowCount() { + checkState(mergedRowCountAvailable()); + return partialMergedRowCount(); + } + + /** + * Obtain merged row count as much as possible. There are two scenarios where accurate row count + * can be calculated: + * + *

    1. raw file and no deletion file. + * + *
    2. raw file + deletion file with cardinality. + */ + public long partialMergedRowCount() { + long sum = 0L; + if (rawConvertible) { + List rawFiles = convertToRawFiles().orElse(null); + if (rawFiles != null) { + for (int i = 0; i < rawFiles.size(); i++) { + RawFile rawFile = rawFiles.get(i); + if (dataDeletionFiles == null || dataDeletionFiles.get(i) == null) { + sum += rawFile.rowCount(); + } else if (dataDeletionFiles.get(i).cardinality() != null) { + sum += rawFile.rowCount() - dataDeletionFiles.get(i).cardinality(); + } + } + } + } + return sum; + } + @Override public Optional> convertToRawFiles() { if (rawConvertible) { diff --git a/paimon-core/src/main/java/org/apache/paimon/table/source/DataTableBatchScan.java b/paimon-core/src/main/java/org/apache/paimon/table/source/DataTableBatchScan.java index 635802cc9dcbb..a4fe6d73bba19 100644 --- a/paimon-core/src/main/java/org/apache/paimon/table/source/DataTableBatchScan.java +++ b/paimon-core/src/main/java/org/apache/paimon/table/source/DataTableBatchScan.java @@ -28,7 +28,6 @@ import java.util.ArrayList; import java.util.List; -import java.util.Objects; import static org.apache.paimon.CoreOptions.MergeEngine.FIRST_ROW; @@ -103,9 +102,9 @@ private StartingScanner.Result applyPushDownLimit(StartingScanner.Result result) List limitedSplits = new ArrayList<>(); for (DataSplit dataSplit : splits) { if (dataSplit.rawConvertible()) { - long splitRowCount = getRowCountForSplit(dataSplit); + long partialMergedRowCount = dataSplit.partialMergedRowCount(); limitedSplits.add(dataSplit); - scannedRowCount += splitRowCount; + scannedRowCount += partialMergedRowCount; if (scannedRowCount >= pushDownLimit) { SnapshotReader.Plan newPlan = new PlanImpl(plan.watermark(), plan.snapshotId(), limitedSplits); @@ -117,20 +116,6 @@ private StartingScanner.Result applyPushDownLimit(StartingScanner.Result result) return result; } - /** - * 0 represents that we can't compute the row count of this split: 1. the split needs to be - * merged; 2. the table enabled deletion vector and there are some deletion files. 
-     */
-    private long getRowCountForSplit(DataSplit split) {
-        if (split.deletionFiles().isPresent()
-                && split.deletionFiles().get().stream().anyMatch(Objects::nonNull)) {
-            return 0L;
-        }
-        return split.convertToRawFiles()
-                .map(files -> files.stream().map(RawFile::rowCount).reduce(Long::sum).orElse(0L))
-                .orElse(0L);
-    }
-
     @Override
     public DataTableScan withShard(int indexOfThisSubtask, int numberOfParallelSubtasks) {
         snapshotReader.withShard(indexOfThisSubtask, numberOfParallelSubtasks);
diff --git a/paimon-core/src/test/java/org/apache/paimon/table/source/SplitGeneratorTest.java b/paimon-core/src/test/java/org/apache/paimon/table/source/SplitGeneratorTest.java
index a9e093dab124e..a1f7d69e28779 100644
--- a/paimon-core/src/test/java/org/apache/paimon/table/source/SplitGeneratorTest.java
+++ b/paimon-core/src/test/java/org/apache/paimon/table/source/SplitGeneratorTest.java
@@ -43,10 +43,10 @@
 public class SplitGeneratorTest {
 
     public static DataFileMeta newFileFromSequence(
-            String name, int rowCount, long minSequence, long maxSequence) {
+            String name, int fileSize, long minSequence, long maxSequence) {
         return new DataFileMeta(
                 name,
-                rowCount,
+                fileSize,
                 1,
                 EMPTY_ROW,
                 EMPTY_ROW,
diff --git a/paimon-core/src/test/java/org/apache/paimon/table/source/SplitTest.java b/paimon-core/src/test/java/org/apache/paimon/table/source/SplitTest.java
index 359d38c973db1..0219941a0ac0b 100644
--- a/paimon-core/src/test/java/org/apache/paimon/table/source/SplitTest.java
+++ b/paimon-core/src/test/java/org/apache/paimon/table/source/SplitTest.java
@@ -49,6 +49,41 @@
 /** Test for {@link DataSplit}. */
 public class SplitTest {
 
+    @Test
+    public void testSplitMergedRowCount() {
+        // not rawConvertible
+        List<DataFileMeta> dataFiles =
+                Arrays.asList(newDataFile(1000L), newDataFile(2000L), newDataFile(3000L));
+        DataSplit split = newDataSplit(false, dataFiles, null);
+        assertThat(split.partialMergedRowCount()).isEqualTo(0L);
+        assertThat(split.mergedRowCountAvailable()).isEqualTo(false);
+
+        // rawConvertible without deletion files
+        split = newDataSplit(true, dataFiles, null);
+        assertThat(split.partialMergedRowCount()).isEqualTo(6000L);
+        assertThat(split.mergedRowCountAvailable()).isEqualTo(true);
+        assertThat(split.mergedRowCount()).isEqualTo(6000L);
+
+        // rawConvertible with deletion files without cardinality
+        ArrayList<DeletionFile> deletionFiles = new ArrayList<>();
+        deletionFiles.add(null);
+        deletionFiles.add(new DeletionFile("p", 1, 2, null));
+        deletionFiles.add(new DeletionFile("p", 1, 2, 100L));
+        split = newDataSplit(true, dataFiles, deletionFiles);
+        assertThat(split.partialMergedRowCount()).isEqualTo(3900L);
+        assertThat(split.mergedRowCountAvailable()).isEqualTo(false);
+
+        // rawConvertible with deletion files with cardinality
+        deletionFiles = new ArrayList<>();
+        deletionFiles.add(null);
+        deletionFiles.add(new DeletionFile("p", 1, 2, 200L));
+        deletionFiles.add(new DeletionFile("p", 1, 2, 100L));
+        split = newDataSplit(true, dataFiles, deletionFiles);
+        assertThat(split.partialMergedRowCount()).isEqualTo(5700L);
+        assertThat(split.mergedRowCountAvailable()).isEqualTo(true);
+        assertThat(split.mergedRowCount()).isEqualTo(5700L);
+    }
+
     @Test
     public void testSerializer() throws IOException {
         DataFileTestDataGenerator gen = DataFileTestDataGenerator.builder().build();
@@ -311,4 +346,36 @@ public void testSerializerCompatibleV3() throws Exception {
                 InstantiationUtil.deserializeObject(v2Bytes, DataSplit.class.getClassLoader());
         assertThat(actual).isEqualTo(split);
     }
+
+    private DataFileMeta newDataFile(long rowCount) {
+        return DataFileMeta.forAppend(
+                "my_data_file.parquet",
+                1024 * 1024,
+                rowCount,
+                null,
+                0L,
+                rowCount,
+                1,
+                Collections.emptyList(),
+                null,
+                null,
+                null);
+    }
+
+    private DataSplit newDataSplit(
+            boolean rawConvertible,
+            List<DataFileMeta> dataFiles,
+            List<DeletionFile> deletionFiles) {
+        DataSplit.Builder builder = DataSplit.builder();
+        builder.withSnapshot(1)
+                .withPartition(BinaryRow.EMPTY_ROW)
+                .withBucket(1)
+                .withBucketPath("my path")
+                .rawConvertible(rawConvertible)
+                .withDataFiles(dataFiles);
+        if (deletionFiles != null) {
+            builder.withDataDeletionFiles(deletionFiles);
+        }
+        return builder.build();
+    }
 }
diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonScanBuilder.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonScanBuilder.scala
index d8b66e1cd1e03..0393a1cd15786 100644
--- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonScanBuilder.scala
+++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/PaimonScanBuilder.scala
@@ -21,6 +21,7 @@ package org.apache.paimon.spark
 import org.apache.paimon.predicate.PredicateBuilder
 import org.apache.paimon.spark.aggregate.LocalAggregator
 import org.apache.paimon.table.Table
+import org.apache.paimon.table.source.DataSplit
 
 import org.apache.spark.sql.connector.expressions.aggregate.Aggregation
 import org.apache.spark.sql.connector.read.{Scan, SupportsPushDownAggregates, SupportsPushDownLimit}
@@ -36,12 +37,12 @@ class PaimonScanBuilder(table: Table)
   override def pushLimit(limit: Int): Boolean = {
     // It is safe, since we will do nothing if it is the primary table and the split is not `rawConvertible`
     pushDownLimit = Some(limit)
-    // just make a best effort to push down limit
+    // just make the best effort to push down limit
     false
   }
 
   override def supportCompletePushDown(aggregation: Aggregation): Boolean = {
-    // for now we only support complete push down, so there is no difference with `pushAggregation`
+    // for now, we only support complete push down, so there is no difference with `pushAggregation`
     pushAggregation(aggregation)
   }
 
@@ -66,8 +67,11 @@ class PaimonScanBuilder(table: Table)
       val pushedPartitionPredicate = PredicateBuilder.and(pushedPredicates.map(_._2): _*)
       readBuilder.withFilter(pushedPartitionPredicate)
     }
-    val scan = readBuilder.newScan()
-    scan.listPartitionEntries.asScala.foreach(aggregator.update)
+    val dataSplits = readBuilder.newScan().plan().splits().asScala.map(_.asInstanceOf[DataSplit])
+    if (!dataSplits.forall(_.mergedRowCountAvailable())) {
+      return false
+    }
+    dataSplits.foreach(aggregator.update)
     localScan = Some(
       PaimonLocalScan(
         aggregator.result(),
diff --git a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/aggregate/LocalAggregator.scala b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/aggregate/LocalAggregator.scala
index 41e7fd3c3ce90..8988e7218d1f8 100644
--- a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/aggregate/LocalAggregator.scala
+++ b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/aggregate/LocalAggregator.scala
@@ -19,10 +19,10 @@
 package org.apache.paimon.spark.aggregate
 
 import org.apache.paimon.data.BinaryRow
-import org.apache.paimon.manifest.PartitionEntry
 import org.apache.paimon.spark.SparkTypeUtils
 import org.apache.paimon.spark.data.SparkInternalRow
 import org.apache.paimon.table.{DataTable, Table}
+import org.apache.paimon.table.source.DataSplit
 import org.apache.paimon.utils.{InternalRowUtils, ProjectedRow}
 
 import org.apache.spark.sql.catalyst.InternalRow
@@ -78,13 +78,7 @@ class LocalAggregator(table: Table) {
   }
 
   def pushAggregation(aggregation: Aggregation): Boolean = {
-    if (
-      !table.isInstanceOf[DataTable] ||
-      !table.primaryKeys.isEmpty
-    ) {
-      return false
-    }
-    if (table.asInstanceOf[DataTable].coreOptions.deletionVectorsEnabled) {
+    if (!table.isInstanceOf[DataTable]) {
       return false
     }
 
@@ -108,12 +102,12 @@ class LocalAggregator(table: Table) {
     SparkInternalRow.create(partitionType).replace(genericRow)
   }
 
-  def update(partitionEntry: PartitionEntry): Unit = {
+  def update(dataSplit: DataSplit): Unit = {
     assert(isInitialized)
-    val groupByRow = requiredGroupByRow(partitionEntry.partition())
+    val groupByRow = requiredGroupByRow(dataSplit.partition())
     val aggFuncEvaluator =
       groupByEvaluatorMap.getOrElseUpdate(groupByRow, aggFuncEvaluatorGetter())
-    aggFuncEvaluator.foreach(_.update(partitionEntry))
+    aggFuncEvaluator.foreach(_.update(dataSplit))
   }
 
   def result(): Array[InternalRow] = {
@@ -147,7 +141,7 @@ class LocalAggregator(table: Table) {
 }
 
 trait AggFuncEvaluator[T] {
-  def update(partitionEntry: PartitionEntry): Unit
+  def update(dataSplit: DataSplit): Unit
   def result(): T
   def resultType: DataType
   def prettyName: String
@@ -156,8 +150,8 @@
 class CountStarEvaluator extends AggFuncEvaluator[Long] {
   private var _result: Long = 0L
 
-  override def update(partitionEntry: PartitionEntry): Unit = {
-    _result += partitionEntry.recordCount()
+  override def update(dataSplit: DataSplit): Unit = {
+    _result += dataSplit.mergedRowCount()
   }
 
   override def result(): Long = _result
diff --git a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTest.scala
index ba314e3afa816..503f1c8e3e9d6 100644
--- a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTest.scala
+++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTest.scala
@@ -18,7 +18,7 @@
 
 package org.apache.paimon.spark.sql
 
-import org.apache.paimon.spark.{PaimonBatch, PaimonInputPartition, PaimonScan, PaimonSparkTestBase, SparkTable}
+import org.apache.paimon.spark.{PaimonScan, PaimonSparkTestBase, SparkTable}
 import org.apache.paimon.table.source.DataSplit
 
 import org.apache.spark.sql.Row
@@ -29,8 +29,6 @@ import org.apache.spark.sql.connector.read.{ScanBuilder, SupportsPushDownLimit}
 import org.apache.spark.sql.util.CaseInsensitiveStringMap
 import org.junit.jupiter.api.Assertions
 
-import scala.collection.JavaConverters._
-
 class PaimonPushDownTest extends PaimonSparkTestBase {
 
   import testImplicits._
@@ -64,7 +62,7 @@ class PaimonPushDownTest extends PaimonSparkTestBase {
     checkAnswer(spark.sql(q), Row(1, "a", "p1") :: Nil)
 
     // case 2
-    // filter "id = '1' or pt = 'p1'" can't push down completely, it still need to be evaluated after scanning
+    // filter "id = '1' or pt = 'p1'" can't push down completely, it still needs to be evaluated after scanning
     q = "SELECT * FROM T WHERE id = '1' or pt = 'p1'"
     Assertions.assertTrue(checkEqualToFilterExists(q, "pt", Literal("p1")))
     checkAnswer(spark.sql(q), Row(1, "a", "p1") :: Row(2, "b", "p1") :: Nil)
@@ -121,7 +119,7 @@ class PaimonPushDownTest extends PaimonSparkTestBase {
     val dataSplitsWithoutLimit = scanBuilder.build().asInstanceOf[PaimonScan].getOriginSplits
     Assertions.assertTrue(dataSplitsWithoutLimit.length >= 2)
 
-    // It still return false even it can push down limit.
+    // It still returns false even if it can push down limit.
     Assertions.assertFalse(scanBuilder.asInstanceOf[SupportsPushDownLimit].pushLimit(1))
     val dataSplitsWithLimit = scanBuilder.build().asInstanceOf[PaimonScan].getOriginSplits
     Assertions.assertEquals(1, dataSplitsWithLimit.length)
@@ -169,12 +167,7 @@ class PaimonPushDownTest extends PaimonSparkTestBase {
     // Now, we have 4 dataSplits, and 2 dataSplit is nonRawConvertible, 2 dataSplit is rawConvertible.
     Assertions.assertEquals(
       2,
-      dataSplitsWithoutLimit2
-        .filter(
-          split => {
-            split.asInstanceOf[DataSplit].rawConvertible()
-          })
-        .length)
+      dataSplitsWithoutLimit2.count(split => { split.asInstanceOf[DataSplit].rawConvertible() }))
 
     // Return 2 dataSplits.
     Assertions.assertFalse(scanBuilder2.asInstanceOf[SupportsPushDownLimit].pushLimit(2))
@@ -206,7 +199,40 @@ class PaimonPushDownTest extends PaimonSparkTestBase {
 
     // Need to scan all dataSplits.
     Assertions.assertEquals(4, dataSplitsWithLimit3.length)
     Assertions.assertEquals(1, spark.sql("SELECT * FROM T LIMIT 1").count())
+  }
+  test("Paimon pushDown: limit for table with deletion vector") {
+    Seq(true, false).foreach(
+      deletionVectorsEnabled => {
+        Seq(true, false).foreach(
+          primaryKeyTable => {
+            withTable("T") {
+              sql(s"""
+                     |CREATE TABLE T (id INT)
+                     |TBLPROPERTIES (
+                     | 'deletion-vectors.enabled' = $deletionVectorsEnabled,
+                     | '${if (primaryKeyTable) "primary-key" else "bucket-key"}' = 'id',
+                     | 'bucket' = '10'
+                     |)
+                     |""".stripMargin)
+
+              sql("INSERT INTO T SELECT id FROM range (1, 50000)")
+              sql("DELETE FROM T WHERE id % 13 = 0")
+
+              val withoutLimit = getScanBuilder().build().asInstanceOf[PaimonScan].getOriginSplits
+              assert(withoutLimit.length == 10)
+
+              val scanBuilder = getScanBuilder().asInstanceOf[SupportsPushDownLimit]
+              scanBuilder.pushLimit(1)
+              val withLimit = scanBuilder.build().asInstanceOf[PaimonScan].getOriginSplits
+              if (deletionVectorsEnabled || !primaryKeyTable) {
+                assert(withLimit.length == 1)
+              } else {
+                assert(withLimit.length == 10)
+              }
+            }
+          })
+      })
   }
 
   test("Paimon pushDown: runtime filter") {
@@ -250,8 +276,7 @@ class PaimonPushDownTest extends PaimonSparkTestBase {
   }
 
   private def getScanBuilder(tableName: String = "T"): ScanBuilder = {
-    new SparkTable(loadTable(tableName))
-      .newScanBuilder(CaseInsensitiveStringMap.empty())
+    SparkTable(loadTable(tableName)).newScanBuilder(CaseInsensitiveStringMap.empty())
   }
 
   private def checkFilterExists(sql: String): Boolean = {
@@ -272,5 +297,4 @@ class PaimonPushDownTest extends PaimonSparkTestBase {
       case _ => false
     }
   }
-
 }
diff --git a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PushDownAggregatesTest.scala b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PushDownAggregatesTest.scala
index 501e7bfb4a515..78c02644a7ced 100644
--- a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PushDownAggregatesTest.scala
+++ b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PushDownAggregatesTest.scala
@@ -117,22 +117,58 @@ class PushDownAggregatesTest extends PaimonSparkTestBase with AdaptiveSparkPlanH
     }
   }
 
-  test("Push down aggregate - primary table") {
-    withTable("T") {
-      spark.sql("CREATE TABLE T (c1 INT, c2 STRING) TBLPROPERTIES ('primary-key' = 'c1')")
-      runAndCheckAggregate("SELECT COUNT(*) FROM T", Row(0) :: Nil, 2)
-      spark.sql("INSERT INTO T VALUES(1, 'x'), (2, 'x'), (3, 'x'), (3, 'x')")
-      runAndCheckAggregate("SELECT COUNT(*) FROM T", Row(3) :: Nil, 2)
-    }
+  test("Push down aggregate - primary key table with deletion vector") {
+    Seq(true, false).foreach(
+      deletionVectorsEnabled => {
+        withTable("T") {
+          spark.sql(s"""
+                       |CREATE TABLE T (c1 INT, c2 STRING)
+                       |TBLPROPERTIES (
+                       |'primary-key' = 'c1',
+                       |'deletion-vectors.enabled' = $deletionVectorsEnabled
+                       |)
+                       |""".stripMargin)
+          runAndCheckAggregate("SELECT COUNT(*) FROM T", Row(0) :: Nil, 0)
+
+          spark.sql("INSERT INTO T VALUES(1, 'x'), (2, 'x'), (3, 'x'), (3, 'x')")
+          runAndCheckAggregate("SELECT COUNT(*) FROM T", Row(3) :: Nil, 0)
+
+          spark.sql("INSERT INTO T VALUES(1, 'x_1')")
+          if (deletionVectorsEnabled) {
+            runAndCheckAggregate("SELECT COUNT(*) FROM T", Row(3) :: Nil, 0)
+          } else {
+            runAndCheckAggregate("SELECT COUNT(*) FROM T", Row(3) :: Nil, 2)
+          }
+        }
+      })
   }
 
-  test("Push down aggregate - enable deletion vector") {
-    withTable("T") {
-      spark.sql(
-        "CREATE TABLE T (c1 INT, c2 STRING) TBLPROPERTIES('deletion-vectors.enabled' = 'true')")
-      runAndCheckAggregate("SELECT COUNT(*) FROM T", Row(0) :: Nil, 2)
-      spark.sql("INSERT INTO T VALUES(1, 'x'), (2, 'x'), (3, 'x'), (3, 'x')")
-      runAndCheckAggregate("SELECT COUNT(*) FROM T", Row(4) :: Nil, 2)
-    }
+  test("Push down aggregate - table with deletion vector") {
+    Seq(true, false).foreach(
+      deletionVectorsEnabled => {
+        Seq(true, false).foreach(
+          primaryKeyTable => {
+            withTable("T") {
+              sql(s"""
+                     |CREATE TABLE T (id INT)
+                     |TBLPROPERTIES (
+                     | 'deletion-vectors.enabled' = $deletionVectorsEnabled,
+                     | '${if (primaryKeyTable) "primary-key" else "bucket-key"}' = 'id',
+                     | 'bucket' = '1'
+                     |)
+                     |""".stripMargin)
+
+              sql("INSERT INTO T SELECT id FROM range (0, 5000)")
+              runAndCheckAggregate("SELECT COUNT(*) FROM T", Seq(Row(5000)), 0)
+
+              sql("DELETE FROM T WHERE id > 100 and id <= 400")
+              if (deletionVectorsEnabled || !primaryKeyTable) {
+                runAndCheckAggregate("SELECT COUNT(*) FROM T", Seq(Row(4700)), 0)
+              } else {
+                runAndCheckAggregate("SELECT COUNT(*) FROM T", Seq(Row(4700)), 2)
+              }
+            }
+          })
+      })
   }
 }
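
The sketch below is not part of the patch; it is a minimal illustration, assuming only the DataSplit API used above (mergedRowCountAvailable() and mergedRowCount()), of how a caller deciding on metadata-only answers, such as an aggregate push-down, might consume these helpers. The class and method names here are hypothetical.

    import java.util.List;

    import org.apache.paimon.table.source.DataSplit;

    // Hypothetical helper, for illustration only.
    public class MergedRowCountExample {

        /**
         * Sums the exact merged row count of the given splits, or returns -1 when any split
         * cannot be counted from metadata alone (for example, a primary key split that still
         * needs merging, or a deletion file without a recorded cardinality).
         */
        static long exactRowCountOrUnknown(List<DataSplit> splits) {
            long total = 0L;
            for (DataSplit split : splits) {
                if (!split.mergedRowCountAvailable()) {
                    return -1L; // fall back to a real scan instead of a metadata-only answer
                }
                total += split.mergedRowCount();
            }
            return total;
        }
    }

The Spark changes above follow the same pattern: PaimonScanBuilder only builds a PaimonLocalScan when every DataSplit reports mergedRowCountAvailable(), and CountStarEvaluator then sums mergedRowCount() per split.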