Commit 4746938

[common] Support variant type
1 parent 9a299db commit 4746938

72 files changed

Lines changed: 8310 additions & 46 deletions


fluss-client/src/main/java/org/apache/fluss/client/table/scanner/log/LogFetcher.java

Lines changed: 7 additions & 1 deletion

```diff
@@ -528,9 +528,15 @@ Map<Integer, FetchLogRequest> prepareFetchLogRequests() {
                     new PbFetchLogReqForTable().setTableId(finalTableId);
             if (readContext.isProjectionPushDowned()) {
                 assert projection != null;
+                // When shredding is enabled, use the expanded projection
+                // that includes shredded columns for the server request
+                int[] projectedFields =
+                        readContext.getStorageProjectionInOrder() != null
+                                ? readContext.getStorageProjectionInOrder()
+                                : projection.getProjectionInOrder();
                 reqForTable
                         .setProjectionPushdownEnabled(true)
-                        .setProjectedFields(projection.getProjectionInOrder());
+                        .setProjectedFields(projectedFields);
             } else {
                 reqForTable.setProjectionPushdownEnabled(false);
             }
```
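
To make the fallback concrete, here is a minimal, self-contained sketch of the selection logic above. The class name and the column indices (a user projection of `[0, 2]` where column 2 is a Variant column, hypothetically expanded to `[0, 2, 3, 4]` by shredding) are illustrative, not taken from the commit:

```java
import java.util.Arrays;

// Sketch of the projection fallback in prepareFetchLogRequests(); indices are hypothetical.
public class ProjectionFallbackSketch {

    // Prefer the expanded storage projection (user columns plus shredded sub-columns)
    // when shredding produced one; otherwise fall back to the user-visible projection.
    static int[] chooseProjectedFields(int[] storageProjection, int[] userProjection) {
        return storageProjection != null ? storageProjection : userProjection;
    }

    public static void main(String[] args) {
        int[] userProjection = {0, 2};          // column 2 is a Variant column
        int[] storageProjection = {0, 2, 3, 4}; // hypothetically, $v.x -> 3, $v.y -> 4

        // With shredding enabled, the expanded projection is sent to the server:
        System.out.println(
                Arrays.toString(chooseProjectedFields(storageProjection, userProjection)));
        // [0, 2, 3, 4]

        // Without a storage projection, the user projection is used as-is:
        System.out.println(Arrays.toString(chooseProjectedFields(null, userProjection)));
        // [0, 2]
    }
}
```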

fluss-client/src/main/java/org/apache/fluss/client/table/scanner/log/LogScannerImpl.java

Lines changed: 3 additions & 1 deletion

```diff
@@ -112,7 +112,9 @@ public LogScannerImpl(
      */
     @Nullable
     private Projection sanityProjection(@Nullable int[] projectedFields, TableInfo tableInfo) {
-        RowType tableRowType = tableInfo.getRowType();
+        // Validate against the user-visible row type (excludes internal shredded columns like $v.x)
+        // so that projection indices from callers (e.g. Flink) stay within user-visible bounds.
+        RowType tableRowType = tableInfo.getUserRowType();
         if (projectedFields != null) {
             for (int projectedField : projectedFields) {
                 if (projectedField < 0 || projectedField >= tableRowType.getFieldCount()) {
```
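
A small sketch of the bounds check this change tightens, assuming a hypothetical table with 3 user-visible columns whose storage schema has grown to 5 after shredding; class and method names are illustrative:

```java
// Sketch: validate projection indices against the user-visible field count,
// not the (possibly larger) storage field count. Counts are hypothetical.
public class ProjectionSanitySketch {

    static void sanityCheck(int[] projectedFields, int userFieldCount) {
        for (int projectedField : projectedFields) {
            if (projectedField < 0 || projectedField >= userFieldCount) {
                throw new IllegalArgumentException(
                        "Projected field " + projectedField
                                + " is out of user-visible bounds [0, " + userFieldCount + ")");
            }
        }
    }

    public static void main(String[] args) {
        int userFieldCount = 3; // user-visible columns: e.g. id, name, $v
        // Storage may have 5 fields once $v is shredded into $v.x and $v.y,
        // but index 4 must still be rejected for callers such as Flink:
        sanityCheck(new int[] {0, 2}, userFieldCount); // ok
        try {
            sanityCheck(new int[] {4}, userFieldCount); // rejected
        } catch (IllegalArgumentException e) {
            System.out.println(e.getMessage());
        }
    }
}
```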

fluss-client/src/main/java/org/apache/fluss/client/write/RecordAccumulator.java

Lines changed: 117 additions & 1 deletion

```diff
@@ -33,10 +33,13 @@
 import org.apache.fluss.metadata.TableInfo;
 import org.apache.fluss.metrics.MetricNames;
 import org.apache.fluss.record.LogRecordBatchStatisticsCollector;
+import org.apache.fluss.row.InternalRow;
 import org.apache.fluss.row.arrow.ArrowWriter;
 import org.apache.fluss.row.arrow.ArrowWriterPool;
+import org.apache.fluss.rpc.gateway.CoordinatorGateway;
 import org.apache.fluss.shaded.arrow.org.apache.arrow.memory.BufferAllocator;
 import org.apache.fluss.shaded.arrow.org.apache.arrow.memory.RootAllocator;
+import org.apache.fluss.types.variant.ShreddingSchemaInferrer;
 import org.apache.fluss.utils.CopyOnWriteMap;
 import org.apache.fluss.utils.MathUtils;
 import org.apache.fluss.utils.clock.Clock;
@@ -113,6 +116,19 @@ public final class RecordAccumulator {
     private final Clock clock;
     private final DynamicWriteBatchSizeEstimator batchSizeEstimator;
 
+    /**
+     * Optional Coordinator gateway used to send {@code ApplyShreddingSchema} RPCs. Set after
+     * construction via {@link #setCoordinatorGateway(CoordinatorGateway)}.
+     */
+    @Nullable private volatile CoordinatorGateway coordinatorGateway;
+
+    /**
+     * Per-table {@link VariantShreddingManager}s. Created lazily on first append to an ARROW_LOG
+     * table with Variant shredding enabled and at least one Variant column.
+     */
+    private final ConcurrentMap<PhysicalTablePath, VariantShreddingManager> shreddingManagers =
+            new CopyOnWriteMap<>();
+
     // TODO add retryBackoffMs to retry the produce request upon receiving an error.
     // TODO add deliveryTimeoutMs to report success or failure on record delivery.
     // TODO add nextBatchExpiryTimeMs
@@ -158,6 +174,91 @@ private void registerMetrics(WriterMetricGroup writerMetricGroup) {
                 MetricNames.WRITER_BUFFER_WAITING_THREADS, writerBufferPool::queued);
     }
 
+    /**
+     * Sets the {@link CoordinatorGateway} to use for Variant shredding schema evolution RPCs.
+     *
+     * <p>This must be called once after the accumulator is constructed (and after the coordinator
+     * server is known) to enable automatic shredding. If not called, Variant statistics will still
+     * be collected locally but no schema evolution RPC will be fired.
+     */
+    public void setCoordinatorGateway(CoordinatorGateway gateway) {
+        this.coordinatorGateway = gateway;
+    }
+
+    /**
+     * Collects Variant statistics for the row being appended, and — once enough samples have been
+     * observed — fires an async schema-evolution RPC to the Coordinator.
+     *
+     * <p>This method is a no-op when:
+     *
+     * <ul>
+     *   <li>the write format is not {@link WriteFormat#ARROW_LOG}
+     *   <li>the table has no Variant columns
+     *   <li>Variant shredding is disabled in the table's configuration
+     *   <li>the coordinator gateway has not been set
+     * </ul>
+     */
+    private void maybeCollectVariantStats(
+            PhysicalTablePath physicalTablePath,
+            TableInfo tableInfo,
+            WriteFormat writeFormat,
+            InternalRow row) {
+        if (coordinatorGateway == null) {
+            return;
+        }
+        if (writeFormat != WriteFormat.ARROW_LOG) {
+            return;
+        }
+        if (!tableInfo.isVariantShreddingEnabled()) {
+            return;
+        }
+        int[] variantIndices = tableInfo.getVariantColumnIndices();
+        if (variantIndices.length == 0) {
+            return;
+        }
+
+        VariantShreddingManager manager =
+                shreddingManagers.computeIfAbsent(
+                        physicalTablePath,
+                        path -> {
+                            String[] colNames = new String[variantIndices.length];
+                            for (int i = 0; i < variantIndices.length; i++) {
+                                colNames[i] =
+                                        tableInfo
+                                                .getRowType()
+                                                .getFields()
+                                                .get(variantIndices[i])
+                                                .getName();
+                            }
+                            ShreddingSchemaInferrer inferrer =
+                                    new ShreddingSchemaInferrer()
+                                            .setPresenceThreshold(
+                                                    tableInfo
+                                                            .getTableConfig()
+                                                            .getVariantShreddingPresenceThreshold())
+                                            .setTypeConsistencyThreshold(
+                                                    tableInfo
+                                                            .getTableConfig()
+                                                            .getVariantShreddingTypeConsistencyThreshold())
+                                            .setMaxShreddedFields(
+                                                    tableInfo
+                                                            .getTableConfig()
+                                                            .getVariantShreddingMaxFields())
+                                            .setMinSampleSize(
+                                                    tableInfo
+                                                            .getTableConfig()
+                                                            .getVariantShreddingMinSampleSize());
+                            CoordinatorGateway gw = coordinatorGateway;
+                            return new VariantShreddingManager(
+                                    path.getTablePath(),
+                                    variantIndices,
+                                    colNames,
+                                    inferrer,
+                                    gw::applyShreddingSchema);
+                        });
+        manager.collectRow(row);
+    }
+
     /**
      * Add a record to the accumulator, return to append result.
      *
@@ -195,6 +296,12 @@ public RecordAppendResult append(
             synchronized (dq) {
                 RecordAppendResult appendResult = tryAppend(writeRecord, callback, dq);
                 if (appendResult != null) {
+                    // Row was appended to an existing batch; collect Variant statistics.
+                    maybeCollectVariantStats(
+                            physicalTablePath,
+                            tableInfo,
+                            writeRecord.getWriteFormat(),
+                            writeRecord.getRow());
                     return appendResult;
                 }
             }
@@ -212,6 +319,12 @@ public RecordAppendResult append(
                             writeRecord, callback, bucketId, tableInfo, dq, memorySegments);
             if (appendResult.newBatchCreated) {
                 memorySegments = Collections.emptyList();
+                // Row was appended to the new batch; collect Variant statistics.
+                maybeCollectVariantStats(
+                        physicalTablePath,
+                        tableInfo,
+                        writeRecord.getWriteFormat(),
+                        writeRecord.getRow());
             }
             return appendResult;
         }
@@ -628,7 +741,10 @@ private WriteBatch createWriteBatch(
                             schemaId,
                             outputView.getPreAllocatedSize(),
                             tableInfo.getRowType(),
-                            tableInfo.getTableConfig().getArrowCompressionInfo());
+                            tableInfo.getTableConfig().getArrowCompressionInfo(),
+                            tableInfo.getShreddingSchemas().isEmpty()
+                                    ? null
+                                    : tableInfo.getShreddingSchemas());
         LogRecordBatchStatisticsCollector statisticsCollector = null;
         if (tableInfo.isStatisticsEnabled()) {
             statisticsCollector =
```
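
The inferrer construction above reads four thresholds from the table config. The sketch below shows the same builder chain with hypothetical literal values in place of the config lookups; the threshold semantics in the comments are an interpretation of the setter names, not documented behavior:

```java
import org.apache.fluss.types.variant.ShreddingSchemaInferrer;

// Sketch of the inferrer configuration built inside maybeCollectVariantStats(),
// with hypothetical values standing in for the TableConfig lookups.
public class InferrerConfigSketch {
    public static void main(String[] args) {
        ShreddingSchemaInferrer inferrer =
                new ShreddingSchemaInferrer()
                        // presumably: shred a field only if it appears in enough sampled variants
                        .setPresenceThreshold(0.9)
                        // presumably: ... and its value type is consistent often enough
                        .setTypeConsistencyThreshold(0.95)
                        // cap the number of shredded sub-columns per Variant column
                        .setMaxShreddedFields(16)
                        // don't infer before this many rows have been sampled
                        .setMinSampleSize(1000);
        System.out.println("min sample size = " + inferrer.getMinSampleSize());
    }
}
```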
fluss-client/src/main/java/org/apache/fluss/client/write/VariantShreddingManager.java

Lines changed: 199 additions & 0 deletions (new file)

```java
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.fluss.client.write;

import org.apache.fluss.annotation.Internal;
import org.apache.fluss.metadata.TablePath;
import org.apache.fluss.row.InternalRow;
import org.apache.fluss.rpc.messages.ApplyShreddingSchemaRequest;
import org.apache.fluss.rpc.messages.ApplyShreddingSchemaResponse;
import org.apache.fluss.rpc.messages.PbTablePath;
import org.apache.fluss.types.variant.ShreddingSchema;
import org.apache.fluss.types.variant.ShreddingSchemaInferrer;
import org.apache.fluss.types.variant.Variant;
import org.apache.fluss.types.variant.VariantStatisticsCollector;

import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.util.concurrent.CompletableFuture;
import java.util.concurrent.atomic.AtomicBoolean;
import java.util.function.Function;

/**
 * Manages automatic Variant shredding inference for a single table on the client write path.
 *
 * <p>Each time a row is appended to a write batch ({@link #collectRow(InternalRow)}), this manager
 * extracts the Variant values from the row's Variant-typed columns and feeds them into per-column
 * {@link VariantStatisticsCollector}s. Once the minimum sample threshold is met and a non-empty
 * {@link ShreddingSchema} is inferred, an asynchronous RPC is dispatched to the Coordinator to
 * trigger server-side schema evolution.
 *
 * <p>Schema evolution is triggered <em>at most once</em> per manager instance. If the RPC fails
 * (e.g., transient network error), the {@link #schemaTriggered} flag is reset to allow a retry on
 * the next collected row.
 *
 * <p>Thread safety: {@link #collectRow} is called from the writer thread and is guarded by the
 * deque lock in {@link RecordAccumulator}. The {@link #schemaTriggered} flag is an {@link
 * AtomicBoolean} so it can safely be reset from the RPC callback thread.
 */
@Internal
public class VariantShreddingManager {

    private static final Logger LOG = LoggerFactory.getLogger(VariantShreddingManager.class);

    private final TablePath tablePath;

    /**
     * Column indices (into the row's schema) of all Variant-typed columns. Each index maps to the
     * corresponding {@link VariantStatisticsCollector} in {@link #collectors} at the same array
     * position.
     */
    private final int[] variantColumnIndices;

    /**
     * Names of the Variant columns, used to construct the column-name-based {@link
     * ShreddingSchema}.
     */
    private final String[] variantColumnNames;

    /** One statistics collector per Variant column. */
    private final VariantStatisticsCollector[] collectors;

    /** Inferrer, configured from the table's shredding options. */
    private final ShreddingSchemaInferrer inferrer;

    /**
     * Guards against duplicate schema evolution RPCs. Set to {@code true} when an RPC is in flight;
     * reset to {@code false} on RPC failure so the next {@link #collectRow} call can retry.
     */
    private final AtomicBoolean schemaTriggered = new AtomicBoolean(false);

    /**
     * Callback that sends the {@link ApplyShreddingSchemaRequest} to the Coordinator and returns a
     * future. Injected by {@link RecordAccumulator} so this class does not depend on a concrete RPC
     * client.
     */
    private final Function<
                    ApplyShreddingSchemaRequest, CompletableFuture<ApplyShreddingSchemaResponse>>
            rpcCaller;

    public VariantShreddingManager(
            TablePath tablePath,
            int[] variantColumnIndices,
            String[] variantColumnNames,
            ShreddingSchemaInferrer inferrer,
            Function<ApplyShreddingSchemaRequest, CompletableFuture<ApplyShreddingSchemaResponse>>
                    rpcCaller) {
        this.tablePath = tablePath;
        this.variantColumnIndices = variantColumnIndices;
        this.variantColumnNames = variantColumnNames;
        this.inferrer = inferrer;
        this.rpcCaller = rpcCaller;

        this.collectors = new VariantStatisticsCollector[variantColumnIndices.length];
        for (int i = 0; i < variantColumnIndices.length; i++) {
            this.collectors[i] = new VariantStatisticsCollector();
        }
    }

    /**
     * Collects statistics from one row that is about to be (or has just been) written.
     *
     * <p>This method extracts the Variant value at each variant-column index from {@code row} and
     * feeds it into the corresponding {@link VariantStatisticsCollector}. If the inferrer produces
     * a non-empty schema for any column, {@link #triggerSchemaEvolution} is called.
     *
     * @param row the row being written
     */
    public void collectRow(InternalRow row) {
        if (schemaTriggered.get()) {
            return;
        }

        for (int c = 0; c < variantColumnIndices.length; c++) {
            int colIdx = variantColumnIndices[c];
            Variant variant = row.isNullAt(colIdx) ? null : row.getVariant(colIdx);
            collectors[c].collect(variant);
        }

        maybeInferAndTrigger();
    }

    // --------------------------------------------------------------------------------------------
    // Internal helpers
    // --------------------------------------------------------------------------------------------

    private void maybeInferAndTrigger() {
        for (int c = 0; c < variantColumnIndices.length; c++) {
            VariantStatisticsCollector collector = collectors[c];
            long totalRecords = collector.getTotalRecords();

            // Skip inference until we have enough samples to be statistically meaningful.
            // This avoids creating empty ShreddingSchema objects on every row.
            if (totalRecords < inferrer.getMinSampleSize()) {
                continue;
            }

            ShreddingSchema schema =
                    inferrer.infer(variantColumnNames[c], collector.getStatistics(), totalRecords);
            if (!schema.getFields().isEmpty()) {
                triggerSchemaEvolution(schema);
                return;
            }
        }
    }

    private void triggerSchemaEvolution(ShreddingSchema schema) {
        if (!schemaTriggered.compareAndSet(false, true)) {
            return;
        }

        String schemaJson = schema.toJson();
        LOG.info(
                "Triggering Variant shredding schema evolution for table {}: {}",
                tablePath,
                schemaJson);

        ApplyShreddingSchemaRequest request =
                new ApplyShreddingSchemaRequest()
                        .setTablePath(
                                new PbTablePath()
                                        .setDatabaseName(tablePath.getDatabaseName())
                                        .setTableName(tablePath.getTableName()))
                        .setShreddingSchemaJson(schemaJson);

        rpcCaller
                .apply(request)
                .whenComplete(
                        (resp, ex) -> {
                            if (ex != null) {
                                LOG.warn(
                                        "Failed to apply Variant shredding schema for table {}, "
                                                + "will retry on next row: {}",
                                        tablePath,
                                        ex.getMessage());
                                schemaTriggered.set(false);
                            } else {
                                LOG.info(
                                        "Successfully applied Variant shredding schema for table {}",
                                        tablePath);
                            }
                        });
    }
}
```
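
The at-most-once trigger with retry-on-failure in `triggerSchemaEvolution` reduces to a small reusable pattern: `compareAndSet` closes a gate before the RPC goes out, and a failed future re-opens it. Below is a self-contained sketch of just that pattern, stripped of the Fluss types; the class name and the String-typed future are illustrative:

```java
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.atomic.AtomicBoolean;

// Sketch of the trigger/retry pattern: at most one RPC in flight, retry after failure.
public class TriggerOnceSketch {

    private final AtomicBoolean triggered = new AtomicBoolean(false);

    void maybeTrigger(CompletableFuture<String> rpc) {
        if (!triggered.compareAndSet(false, true)) {
            return; // an RPC is already in flight or has already succeeded
        }
        rpc.whenComplete(
                (resp, ex) -> {
                    if (ex != null) {
                        triggered.set(false); // re-arm so the next row can retry
                    }
                });
    }

    public static void main(String[] args) {
        TriggerOnceSketch s = new TriggerOnceSketch();

        // A failing RPC re-opens the gate:
        CompletableFuture<String> failing = new CompletableFuture<>();
        s.maybeTrigger(failing);
        failing.completeExceptionally(new RuntimeException("transient network error"));

        // So a later attempt goes through; success keeps the gate closed for good:
        s.maybeTrigger(CompletableFuture.completedFuture("applied"));
        System.out.println("triggered = " + s.triggered.get()); // true
    }
}
```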
