apache
diff --git a/paimon-common/src/main/java/org/apache/paimon/reader/DataEvolutionFileReader.java b/paimon-common/src/main/java/org/apache/paimon/reader/DataEvolutionFileReader.java
Lines changed: 9 additions & 0 deletions
diff --git a/paimon-common/src/main/java/org/apache/paimon/reader/DataEvolutionFileRecordIterator.java b/paimon-common/src/main/java/org/apache/paimon/reader/DataEvolutionFileRecordIterator.java
Lines changed: 53 additions & 0 deletions
diff --git a/paimon-core/src/main/java/org/apache/paimon/append/ForceSingleBatchReader.java b/paimon-core/src/main/java/org/apache/paimon/append/ForceSingleBatchReader.java
Lines changed: 51 additions & 3 deletions
diff --git a/paimon-core/src/main/java/org/apache/paimon/operation/commit/ConflictDetection.java b/paimon-core/src/main/java/org/apache/paimon/operation/commit/ConflictDetection.java
Lines changed: 64 additions & 13 deletions
diff --git a/paimon-core/src/test/java/org/apache/paimon/operation/commit/ConflictDetectionTest.java b/paimon-core/src/test/java/org/apache/paimon/operation/commit/ConflictDetectionTest.java
Lines changed: 37 additions & 0 deletions
diff --git a/paimon-spark/paimon-spark-3.5/src/test/scala/org/apache/paimon/spark/sql/RowTrackingTest.scala b/paimon-spark/paimon-spark-3.5/src/test/scala/org/apache/paimon/spark/sql/RowTrackingTest.scala
Lines changed: 23 additions & 0 deletions
diff --git a/paimon-spark/paimon-spark-4.0/src/test/scala/org/apache/paimon/spark/sql/RowTrackingTest.scala b/paimon-spark/paimon-spark-4.0/src/test/scala/org/apache/paimon/spark/sql/RowTrackingTest.scala
Lines changed: 61 additions & 1 deletion
@@ -89,6 +89,15 @@ public RecordIterator<InternalRow> readBatch() throws IOException {
                 iterators[i] = batch;
             }
         }
+        // Expose file path and position when possible so callers that need per-row file
+        // metadata (e.g. Spark metadata columns and copy-on-write group filtering) can treat
+        // the assembled row as coming from one deterministic member file of the row-id group.
+        for (RecordIterator<InternalRow> iterator : iterators) {
+            if (iterator instanceof FileRecordIterator) {
+                return new DataEvolutionFileRecordIterator(
+                        row, iterators, (FileRecordIterator<InternalRow>) iterator);
+            }
+        }
         return new DataEvolutionIterator(row, iterators);
     }
 
 
@@ -0,0 +1,53 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.paimon.reader;
+
+import org.apache.paimon.data.InternalRow;
+import org.apache.paimon.fs.Path;
+import org.apache.paimon.reader.RecordReader.RecordIterator;
+
+/**
+ * A {@link DataEvolutionIterator} that additionally implements {@link FileRecordIterator}. Both
+ * {@link #filePath()} and {@link #returnedPosition()} are forwarded to one designated inner
+ * iterator, so a row assembled from several files reports a single deterministic member file of
+ * its row-id group together with the position in it (inner iterators are row-aligned).
+ */
+public class DataEvolutionFileRecordIterator extends DataEvolutionIterator
+        implements FileRecordIterator<InternalRow> {
+
+    private final FileRecordIterator<InternalRow> fileSource;
+
+    public DataEvolutionFileRecordIterator(
+            DataEvolutionRow row,
+            RecordIterator<InternalRow>[] iterators,
+            FileRecordIterator<InternalRow> designated) {
+        super(row, iterators);
+        fileSource = designated;
+    }
+
+    @Override
+    public Path filePath() {
+        return fileSource.filePath();
+    }
+
+    @Override
+    public long returnedPosition() {
+        return fileSource.returnedPosition();
+    }
+}
@@ -19,11 +19,15 @@
 package org.apache.paimon.append;
 
 import org.apache.paimon.data.InternalRow;
+import org.apache.paimon.fs.Path;
+import org.apache.paimon.reader.FileRecordIterator;
+import org.apache.paimon.reader.FileRecordReader;
 import org.apache.paimon.reader.RecordReader;
 
 import javax.annotation.Nullable;
 
 import java.io.IOException;
+import java.io.UncheckedIOException;
 
 /**
  * A record reader that merges all batches from a multi-batch reader into a single concatenated
@@ -53,7 +57,13 @@ public class ForceSingleBatchReader implements RecordReader<InternalRow> {
 
     public ForceSingleBatchReader(RecordReader<InternalRow> multiBatchReader) {
         this.multiBatchReader = multiBatchReader;
-        this.batch = new ConcatBatch(multiBatchReader);
+        // Preserve the file-record capability of the wrapped reader: callers like the
+        // data-evolution union read rely on per-row file path and position (e.g. Spark's
+        // __paimon_file_path metadata column and copy-on-write group filtering).
+        this.batch =
+                multiBatchReader instanceof FileRecordReader
+                        ? new FileConcatBatch(multiBatchReader)
+                        : new ConcatBatch(multiBatchReader);
     }
 
     @Override
@@ -71,8 +81,8 @@ public void close() throws IOException {
 
     private static class ConcatBatch implements RecordIterator<InternalRow> {
 
-        private final RecordReader<InternalRow> reader;
-        private RecordIterator<InternalRow> currentBatch;
+        protected final RecordReader<InternalRow> reader;
+        protected RecordIterator<InternalRow> currentBatch;
 
         private ConcatBatch(RecordReader<InternalRow> reader) {
             this.reader = reader;
@@ -107,4 +117,42 @@ public void releaseBatch() {
             }
         }
     }
+
+    /**
+     * {@link ConcatBatch} over a {@link FileRecordReader} that reports the current batch's file
+     * path and position; when no batch is current (e.g. before {@link #next()}), one is read.
+     */
+    private static class FileConcatBatch extends ConcatBatch
+            implements FileRecordIterator<InternalRow> {
+
+        private FileConcatBatch(RecordReader<InternalRow> reader) {
+            super(reader);
+        }
+
+        @Override
+        public Path filePath() {
+            return currentFileBatch().filePath();
+        }
+
+        @Override
+        public long returnedPosition() {
+            return currentFileBatch().returnedPosition();
+        }
+
+        private FileRecordIterator<InternalRow> currentFileBatch() {
+            if (currentBatch != null) {
+                return (FileRecordIterator<InternalRow>) currentBatch;
+            }
+            try {
+                currentBatch = reader.readBatch();
+            } catch (IOException e) {
+                throw new UncheckedIOException(e);
+            }
+            if (currentBatch == null) {
+                throw new IllegalStateException(
+                        "The file batch is exhausted, file path and position are unavailable.");
+            }
+            return (FileRecordIterator<InternalRow>) currentBatch;
+        }
+    }
 }
@@ -643,30 +643,81 @@ Optional<RuntimeException> checkRowIdExistence(
                         .collect(Collectors.toList());
         RowRangeIndex existingIndex = RowRangeIndex.create(existingRanges, false);
 
+        // Row-id ranges removed by this same commit, keyed by partition and bucket. A
+        // copy-on-write update on a data-evolution table deletes whole row-id groups and re-adds
+        // rewritten rows with their original row ids. File rolling may make an added file cover
+        // only a sub-range of a deleted group and not mirror an existing file exactly; it is still
+        // consistent as long as its range is fully covered by ranges deleted in this commit
+        // (concurrent rewrites of those files are caught by the regular deleted-file conflict
+        // checks).
+        Map<Pair<BinaryRow, Integer>, List<Range>> deletedRanges = new HashMap<>();
+        for (SimpleFileEntry entry : deltaEntries) {
+            if (entry.kind() == FileKind.DELETE && entry.firstRowId() != null) {
+                deletedRanges
+                        .computeIfAbsent(
+                                Pair.of(entry.partition(), entry.bucket()), k -> new ArrayList<>())
+                        .add(
+                                new Range(
+                                        entry.firstRowId(),
+                                        entry.firstRowId() + entry.rowCount() - 1));
+            }
+        }
+
         for (SimpleFileEntry entry : filesToCheck) {
             Range rowRange = entry.nonNullRowIdRange();
             boolean exists =
                     dedicatedStorageFile(entry.fileName())
                             ? existingIndex.contains(rowRange)
                             : existingIndex.containsExactly(rowRange);
-            if (!exists) {
-                return Optional.of(
-                        new RuntimeException(
-                                String.format(
-                                        "Row ID existence conflict: file '%s' references "
-                                                + "firstRowId=%d, rowCount=%d in bucket %d, "
-                                                + "but no matching file exists in the current snapshot. "
-                                                + "The referenced file may have been rewritten by a "
-                                                + "concurrent compaction or removed by an overwrite.",
-                                        entry.fileName(),
-                                        entry.firstRowId(),
-                                        entry.rowCount(),
-                                        entry.bucket())));
+            if (exists) {
+                continue;
             }
+            List<Range> deleted = deletedRanges.get(Pair.of(entry.partition(), entry.bucket()));
+            if (coveredByRanges(
+                    deleted, entry.firstRowId(), entry.firstRowId() + entry.rowCount() - 1)) {
+                continue;
+            }
+            return Optional.of(
+                    new RuntimeException(
+                            String.format(
+                                    "Row ID existence conflict: file '%s' references "
+                                            + "firstRowId=%d, rowCount=%d in bucket %d, "
+                                            + "but no matching file exists in the current snapshot. "
+                                            + "The referenced file may have been rewritten by a "
+                                            + "concurrent compaction or removed by an overwrite.",
+                                    entry.fileName(),
+                                    entry.firstRowId(),
+                                    entry.rowCount(),
+                                    entry.bucket())));
         }
         return Optional.empty();
     }
 
+    /** Whether the union of {@code ranges} (null: none) fully covers {@code [from, to]}. */
+    private static boolean coveredByRanges(@Nullable List<Range> ranges, long from, long to) {
+        if (ranges == null || ranges.isEmpty()) {
+            return false;
+        }
+        // Sort a copy: the caller's per-bucket list may be probed again and must keep its order.
+        List<Range> sorted = new ArrayList<>(ranges);
+        sorted.sort(Comparator.comparingLong(range -> range.from));
+        long cursor = from;
+        for (Range range : sorted) {
+            if (range.to < cursor) {
+                continue;
+            }
+            if (range.from > cursor) {
+                return false;
+            }
+            // Compare before advancing: range.to + 1 wraps around when range.to is Long.MAX_VALUE.
+            if (range.to >= to) {
+                return true;
+            }
+            cursor = range.to + 1;
+        }
+        return cursor > to;
+    }
+
     private static boolean dedicatedStorageFile(String fileName) {
         return isBlobFile(fileName) || isVectorStoreFile(fileName);
     }
 
@@ -533,6 +533,43 @@ void testCheckRowIdExistenceDedicatedFileIgnoresBaseDedicatedFiles() {
         assertThat(result.get().getMessage()).contains("Row ID existence conflict");
     }
 
+    @Test
+    void testCheckRowIdExistenceAcceptsSubRangeCoveredBySameCommitDeletes() {
+        ConflictDetection detector = createConflictDetection();
+
+        List<SimpleFileEntry> snapshotFiles = new ArrayList<>();
+        snapshotFiles.add(createFileEntryWithRowId("f1", ADD, 0L, 100L));
+
+        // The commit deletes f1, i.e. row ids [0, 100), and adds p1 = [0, 40) and p2 = [50, 100).
+        // Neither added range mirrors f1, but both lie inside the range deleted by this commit.
+        List<SimpleFileEntry> commitFiles = new ArrayList<>();
+        commitFiles.add(createFileEntryWithRowId("f1", DELETE, 0L, 100L));
+        commitFiles.add(createFileEntryWithRowId("p1", ADD, 0L, 40L));
+        commitFiles.add(createFileEntryWithRowId("p2", ADD, 50L, 50L));
+
+        assertThat(detector.checkRowIdExistence(snapshotFiles, commitFiles, 100L)).isEmpty();
+    }
+
+    @Test
+    void testCheckRowIdExistenceRejectsSubRangeNotCoveredBySameCommitDeletes() {
+        ConflictDetection detector = createConflictDetection();
+
+        List<SimpleFileEntry> snapshotFiles = new ArrayList<>();
+        snapshotFiles.add(createFileEntryWithRowId("f1", ADD, 0L, 100L));
+        snapshotFiles.add(createFileEntryWithRowId("f2", ADD, 100L, 100L));
+
+        // Only f1 = [0, 100) is deleted, yet p1 = [50, 150) reaches into f2's row ids. Accepting
+        // it would re-add rows of f2 while f2 is still live, i.e. duplicate row ids.
+        List<SimpleFileEntry> commitFiles = new ArrayList<>();
+        commitFiles.add(createFileEntryWithRowId("f1", DELETE, 0L, 100L));
+        commitFiles.add(createFileEntryWithRowId("p1", ADD, 50L, 100L));
+
+        Optional<RuntimeException> conflict =
+                detector.checkRowIdExistence(snapshotFiles, commitFiles, 200L);
+        assertThat(conflict).isPresent();
+        assertThat(conflict.get().getMessage()).contains("Row ID existence conflict");
+    }
+
     @Test
     void testCheckRowIdExistenceSkipsNewlyAppendedFiles() {
         ConflictDetection detection = createConflictDetection();
 
@@ -35,4 +35,27 @@ class RowTrackingTest extends RowTrackingTestBase {
       }
     }
   }
+
+  test("Data Evolution: Spark 3.5 keeps data-evolution tables off the V2 row-level path") {
+    withSparkSQLConf("spark.paimon.write.use-v2-write" -> "true") {
+      withTable("t") {
+        sql(
+          "CREATE TABLE t (id INT, data INT) TBLPROPERTIES " +
+            "('row-tracking.enabled' = 'true', 'data-evolution.enabled' = 'true')")
+        assert(!SparkTable.of(loadTable("t")).isInstanceOf[SupportsRowLevelOperations])
+
+        sql("INSERT INTO t VALUES (1, 1), (2, 2)")
+        // Both row-level statements must fail with their dedicated data-evolution message.
+        val deleteError = intercept[RuntimeException](sql("DELETE FROM t WHERE id = 2"))
+        assert(
+          deleteError.getMessage
+            .contains("Delete operation is not supported when data evolution is enabled yet."))
+
+        val updateError = intercept[RuntimeException](sql("UPDATE t SET data = 20 WHERE id = 2"))
+        assert(
+          updateError.getMessage
+            .contains("Update operation is not supported when data evolution is enabled yet."))
+      }
+    }
+  }
 }
@@ -18,4 +18,64 @@
 
 package org.apache.paimon.spark.sql
 
-class RowTrackingTest extends RowTrackingTestBase {}
+import org.apache.spark.sql.Row
+
+class RowTrackingTest extends RowTrackingTestBase {
+
+  test("Data Evolution: Spark 4.0 uses V2 copy-on-write for UPDATE") {
+    withSparkSQLConf("spark.paimon.write.use-v2-write" -> "true") {
+      withTable("t") {
+        sql(
+          "CREATE TABLE t (id INT, data INT) TBLPROPERTIES " +
+            "('row-tracking.enabled' = 'true', 'data-evolution.enabled' = 'true')")
+        sql("INSERT INTO t SELECT /*+ REPARTITION(1) */ * FROM VALUES (1, 1), (2, 2)")
+        sql("INSERT INTO t SELECT /*+ REPARTITION(1) */ * FROM VALUES (3, 3), (4, 4)")
+
+        sql("UPDATE t SET data = 30 WHERE id = 3")
+
+        // Expect data = 30 for id = 3 and _ROW_ID values 0..3 in id order.
+        val expectedRows = Seq(Row(1, 1, 0), Row(2, 2, 1), Row(3, 30, 2), Row(4, 4, 3))
+        checkAnswer(sql("SELECT *, _ROW_ID FROM t ORDER BY id"), expectedRows)
+      }
+    }
+  }
+
+  test("Data Evolution: DELETE remains unsupported") {
+    withSparkSQLConf("spark.paimon.write.use-v2-write" -> "true") {
+      withTable("t") {
+        sql(
+          "CREATE TABLE t (id INT, data INT) TBLPROPERTIES " +
+            "('row-tracking.enabled' = 'true', 'data-evolution.enabled' = 'true')")
+        sql("INSERT INTO t VALUES (1, 1), (2, 2)")
+
+        // DELETE must be rejected with the data-evolution specific message.
+        val deleteError = intercept[Exception](sql("DELETE FROM t WHERE id = 2"))
+        assert(
+          deleteError.getMessage
+            .contains("Delete operation is not supported when data evolution is enabled yet"))
+      }
+    }
+  }
+
+  test("Data Evolution: partition column update is rejected") {
+    withSparkSQLConf("spark.paimon.write.use-v2-write" -> "true") {
+      withTable("t") {
+        sql("""
+              |CREATE TABLE t (id INT, data INT, dt STRING)
+              |PARTITIONED BY (dt)
+              |TBLPROPERTIES ('row-tracking.enabled' = 'true', 'data-evolution.enabled' = 'true')
+              |""".stripMargin)
+        sql("INSERT INTO t VALUES (1, 1, 'p1'), (2, 2, 'p2')")
+
+        // Updating the partition column must fail; a data-column update must still succeed.
+        val partitionError = intercept[Exception](sql("UPDATE t SET dt = 'p3' WHERE id = 1"))
+        assert(
+          partitionError.getMessage
+            .contains("Update to partition columns is not supported for data evolution tables"))
+
+        sql("UPDATE t SET data = 10 WHERE id = 1")
+        checkAnswer(sql("SELECT * FROM t ORDER BY id"), Seq(Row(1, 10, "p1"), Row(2, 2, "p2")))
+      }
+    }
+  }
+}
Original file line number	Diff line number	Diff line change
`@@ -89,6 +89,15 @@ public RecordIterator<InternalRow> readBatch() throws IOException {`
`89`	`89`	`iterators[i] = batch;`
`90`	`90`	`}`
`91`	`91`	`}`
	`92`	`+ // Expose file path and position when possible so callers that need per-row file`
	`93`	`+ // metadata (e.g. Spark metadata columns and copy-on-write group filtering) can treat`
	`94`	`+ // the assembled row as coming from one deterministic member file of the row-id group.`
	`95`	`+ for (RecordIterator<InternalRow> iterator : iterators) {`
	`96`	`+ if (iterator instanceof FileRecordIterator) {`
	`97`	`+ return new DataEvolutionFileRecordIterator(`
	`98`	`+ row, iterators, (FileRecordIterator<InternalRow>) iterator);`
	`99`	`+ }`
	`100`	`+ }`
`92`	`101`	`return new DataEvolutionIterator(row, iterators);`
`93`	`102`	`}`
`94`	`103`