[HUDI-4353] Column stats data skipping for flink (#6026)

2022-07-03 08:29:31 +08:00
parent bdf73b2650
commit 47792a3186
30 changed files with 1930 additions and 81 deletions
--- a/hudi-client/hudi-flink-client/src/main/java/org/apache/hudi/client/HoodieFlinkWriteClient.java
+++ b/hudi-client/hudi-flink-client/src/main/java/org/apache/hudi/client/HoodieFlinkWriteClient.java
@@ -74,6 +74,7 @@ import org.slf4j.LoggerFactory;
 import java.io.IOException;
 import java.nio.charset.StandardCharsets;
 import java.text.ParseException;
 import java.util.Collection;
 import java.util.HashMap;
 import java.util.Iterator;
 import java.util.List;
@@ -159,10 +160,14 @@ public class HoodieFlinkWriteClient<T extends HoodieRecordPayload> extends
        initTable(WriteOperationType.UPSERT, Option.ofNullable(instantTime));
    table.validateUpsertSchema();
    preWrite(instantTime, WriteOperationType.UPSERT_PREPPED, table.getMetaClient());
-    final HoodieWriteHandle<?, ?, ?, ?> writeHandle = getOrCreateWriteHandle(preppedRecords.get(0), getConfig(),
+    Map<String, List<HoodieRecord<T>>> preppedRecordsByFileId = preppedRecords.stream().parallel()
-        instantTime, table, preppedRecords.listIterator());
+        .collect(Collectors.groupingBy(r -> r.getCurrentLocation().getFileId()));
-    HoodieWriteMetadata<List<WriteStatus>> result = ((HoodieFlinkTable<T>) table).upsertPrepped(context, writeHandle, instantTime, preppedRecords);
+    return preppedRecordsByFileId.values().stream().parallel().map(records -> {
-    return postWrite(result, instantTime, table);
+      final HoodieWriteHandle<?, ?, ?, ?> writeHandle = getOrCreateWriteHandle(records.get(0), getConfig(),
          instantTime, table, records.listIterator());
      HoodieWriteMetadata<List<WriteStatus>> result = ((HoodieFlinkTable<T>) table).upsertPrepped(context, writeHandle, instantTime, records);
      return postWrite(result, instantTime, table);
    }).flatMap(Collection::stream).collect(Collectors.toList());
  }
  @Override
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/configuration/FlinkOptions.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/configuration/FlinkOptions.java
@@ -236,6 +236,13 @@ public class FlinkOptions extends HoodieConfig {
      .noDefaultValue()
      .withDescription("End commit instant for reading, the commit time format should be 'yyyyMMddHHmmss'");
  // Switch for data skipping on the read path; disabled by default.
  // NOTE: the description is built from two concatenated literals, so the first one
  //       must end with a space to keep the words "by" and "skipping" separated.
  public static final ConfigOption<Boolean> READ_DATA_SKIPPING_ENABLED = ConfigOptions
      .key("read.data.skipping.enabled")
      .booleanType()
      .defaultValue(false)
      .withDescription("Enables data-skipping allowing queries to leverage indexes to reduce the search space by "
          + "skipping over files");
  // ------------------------------------------------------------------------
  //  Write Options
  // ------------------------------------------------------------------------
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/configuration/HadoopConfigurations.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/configuration/HadoopConfigurations.java
@@ -18,11 +18,11 @@
 package org.apache.hudi.configuration;
 import org.apache.hudi.util.FlinkClientUtil;
 import org.apache.flink.configuration.Configuration;
 import org.apache.hadoop.fs.Path;
 import org.apache.hudi.util.FlinkClientUtil;
 import java.util.Map;
 /**
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/sink/meta/CkpMetadata.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/sink/meta/CkpMetadata.java
@@ -18,7 +18,6 @@
 package org.apache.hudi.sink.meta;
 import org.apache.flink.configuration.Configuration;
 import org.apache.hudi.common.fs.FSUtils;
 import org.apache.hudi.common.table.HoodieTableMetaClient;
 import org.apache.hudi.common.util.ValidationUtils;
@@ -26,6 +25,7 @@ import org.apache.hudi.configuration.FlinkOptions;
 import org.apache.hudi.configuration.HadoopConfigurations;
 import org.apache.hudi.exception.HoodieException;
 import org.apache.flink.configuration.Configuration;
 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.Path;
 import org.slf4j.Logger;
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/sink/utils/HiveSyncContext.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/sink/utils/HiveSyncContext.java
@@ -18,7 +18,6 @@
 package org.apache.hudi.sink.utils;
 import org.apache.flink.annotation.VisibleForTesting;
 import org.apache.hudi.aws.sync.AwsGlueCatalogSyncTool;
 import org.apache.hudi.common.config.SerializableConfiguration;
 import org.apache.hudi.common.fs.FSUtils;
@@ -29,6 +28,7 @@ import org.apache.hudi.hive.HiveSyncTool;
 import org.apache.hudi.hive.ddl.HiveSyncMode;
 import org.apache.hudi.table.format.FilePathUtils;
 import org.apache.flink.annotation.VisibleForTesting;
 import org.apache.flink.configuration.Configuration;
 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.hive.conf.HiveConf;
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/sink/utils/NonThrownExecutor.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/sink/utils/NonThrownExecutor.java
@@ -155,6 +155,10 @@ public class NonThrownExecutor implements AutoCloseable {
  // -------------------------------------------------------------------------
  //  Inner Class
  // -------------------------------------------------------------------------
  /**
   * The exception hook: a callback that is handed an error message together with a {@link Throwable}.
   *
   * <p>The interface declares exactly one abstract method, so it can be implemented
   * with a lambda expression or a method reference.
   */
  @FunctionalInterface
  public interface ExceptionHook {
    /**
     * Handles the reported error.
     *
     * @param errMsg the error message
     * @param t      the throwable that comes with the message
     */
    void apply(String errMsg, Throwable t);
  }
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/source/FileIndex.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/source/FileIndex.java
@@ -21,14 +21,24 @@ package org.apache.hudi.source;
 import org.apache.hudi.client.common.HoodieFlinkEngineContext;
 import org.apache.hudi.common.config.HoodieMetadataConfig;
 import org.apache.hudi.common.fs.FSUtils;
 import org.apache.hudi.common.util.collection.Pair;
 import org.apache.hudi.configuration.FlinkOptions;
 import org.apache.hudi.configuration.HadoopConfigurations;
 import org.apache.hudi.source.stats.ColumnStatsIndices;
 import org.apache.hudi.source.stats.ExpressionEvaluator;
 import org.apache.hudi.util.DataTypeUtils;
 import org.apache.hudi.util.ExpressionUtils;
 import org.apache.hudi.util.StreamerUtil;
 import org.apache.flink.annotation.VisibleForTesting;
 import org.apache.flink.configuration.Configuration;
 import org.apache.flink.table.data.RowData;
 import org.apache.flink.table.expressions.ResolvedExpression;
 import org.apache.flink.table.types.logical.RowType;
 import org.apache.hadoop.fs.FileStatus;
 import org.apache.hadoop.fs.Path;
 import org.slf4j.Logger;
 import org.slf4j.LoggerFactory;
 import javax.annotation.Nullable;
@@ -40,6 +50,7 @@ import java.util.List;
 import java.util.Map;
 import java.util.Properties;
 import java.util.Set;
 import java.util.stream.Collectors;
 /**
 * A file index which supports listing files efficiently through metadata table.
@@ -47,19 +58,26 @@ import java.util.Set;
 * <p>It caches the partition paths to avoid redundant look up.
 */
 public class FileIndex {
  private static final Logger LOG = LoggerFactory.getLogger(FileIndex.class);
  private final Path path;
  private final RowType rowType;
  private final HoodieMetadataConfig metadataConfig;
-  private List<String> partitionPaths; // cache of partition paths
+  private final boolean dataSkippingEnabled;
  private List<String> partitionPaths;      // cache of partition paths
  private List<ResolvedExpression> filters; // push down filters
  private final boolean tableExists;
-  private FileIndex(Path path, Configuration conf) {
+  private FileIndex(Path path, Configuration conf, RowType rowType) {
    this.path = path;
    this.rowType = rowType;
    this.metadataConfig = metadataConfig(conf);
    this.dataSkippingEnabled = conf.getBoolean(FlinkOptions.READ_DATA_SKIPPING_ENABLED);
    this.tableExists = StreamerUtil.tableExists(path.toString(), HadoopConfigurations.getHadoopConf(conf));
  }
-  public static FileIndex instance(Path path, Configuration conf) {
+  public static FileIndex instance(Path path, Configuration conf, RowType rowType) {
-    return new FileIndex(path, conf);
+    return new FileIndex(path, conf, rowType);
  }
  /**
@@ -119,9 +137,17 @@ public class FileIndex {
      return new FileStatus[0];
    }
    String[] partitions = getOrBuildPartitionPaths().stream().map(p -> fullPartitionPath(path, p)).toArray(String[]::new);
-    return FSUtils.getFilesInPartitions(HoodieFlinkEngineContext.DEFAULT, metadataConfig, path.toString(),
+    FileStatus[] allFileStatus = FSUtils.getFilesInPartitions(HoodieFlinkEngineContext.DEFAULT, metadataConfig, path.toString(),
            partitions, "/tmp/")
        .values().stream().flatMap(Arrays::stream).toArray(FileStatus[]::new);
    Set<String> candidateFiles = candidateFilesInMetadataTable(allFileStatus);
    if (candidateFiles == null) {
      // no need to filter by col stats or error occurs.
      return allFileStatus;
    }
    return Arrays.stream(allFileStatus).parallel()
        .filter(fileStatus -> candidateFiles.contains(fileStatus.getPath().getName()))
        .toArray(FileStatus[]::new);
  }
  /**
@@ -159,10 +185,96 @@ public class FileIndex {
    }
  }
  /**
   * Registers the pushed down filters on this file index.
   *
   * <p>An empty list is ignored: the filters held by this index are left untouched in that case.
   *
   * @param filters the pushed down filter expressions
   */
  public void setFilters(List<ResolvedExpression> filters) {
    if (filters.isEmpty()) {
      // nothing to register
      return;
    }
    // keep a private copy instead of the caller's list instance
    this.filters = new ArrayList<>(filters);
  }
  // -------------------------------------------------------------------------
  //  Utilities
  // -------------------------------------------------------------------------
  /**
   * Computes the pruned set of candidate base-files' names based on the pushed down data filters,
   * by leveraging Metadata Table's Column Statistics index (hereon referred as ColStats for brevity)
   * bearing "min", "max", "num_nulls" statistics for all columns.
   *
   * <p>NOTE: This method has to return complete set of candidate files, since only provided candidates will
   * ultimately be scanned as part of query execution. Hence, this method has to maintain the
   * invariant of conservatively including every base-file's name, that is NOT referenced in its index.
   *
   * <p>The {@code filters} must all be simple.
   *
   * @param allFileStatus the file statuses that are subject to pruning
   * @return set of pruned (data-skipped) candidate base-files' names, or {@code null} when no pruning
   *         applies: data skipping or the metadata table is disabled, there are no filters, the filters
   *         reference no (indexed) column, or reading the column stats failed
   */
  @Nullable
  private Set<String> candidateFilesInMetadataTable(FileStatus[] allFileStatus) {
    // NOTE: Data Skipping is only effective when it references columns that are indexed w/in
    //       the Column Stats Index (CSI). Following cases could not be effectively handled by Data Skipping:
    //          - Expressions on top-level column's fields (ie, for ex filters like "struct.field > 0", since
    //          CSI only contains stats for top-level columns, in this case for "struct")
    //          - Any expression not directly referencing top-level column (for ex, sub-queries, since there's
    //          nothing CSI in particular could be applied for)
    if (!(metadataConfig.enabled() && dataSkippingEnabled)) {
      validateConfig();
      return null;
    }
    if (this.filters == null || this.filters.isEmpty()) {
      return null;
    }
    final String[] referencedCols = ExpressionUtils.referencedColumns(filters);
    if (referencedCols.length == 0) {
      return null;
    }

    try {
      final List<RowData> rawColStats =
          ColumnStatsIndices.readColumnStatsIndex(path.toString(), metadataConfig, referencedCols);
      final Pair<List<RowData>, String[]> transposed =
          ColumnStatsIndices.transposeColumnStatsIndex(rawColStats, referencedCols, rowType);
      final List<RowData> statsRows = transposed.getLeft();
      final String[] queryCols = transposed.getRight();
      if (queryCols.length == 0) {
        // the indexed columns have no intersection with the referenced columns, returns early
        return null;
      }
      final RowType.RowField[] queryFields = DataTypeUtils.projectRowFields(rowType, queryCols);

      // position 0 of each transposed row holds the file name
      final Set<String> indexedFiles = statsRows.stream().parallel()
          .map(statsRow -> statsRow.getString(0).toString())
          .collect(Collectors.toSet());
      final Set<String> candidates = statsRows.stream().parallel()
          .filter(statsRow -> ExpressionEvaluator.filterExprs(filters, statsRow, queryFields))
          .map(statsRow -> statsRow.getString(0).toString())
          .collect(Collectors.toSet());

      // NOTE: Col-Stats Index isn't guaranteed to have complete set of statistics for every
      //       base-file: since it's bound to clustering, which could occur asynchronously
      //       at arbitrary point in time, and is not likely to be touching all the base files.
      //
      //       To close that gap, we manually compute the difference b/w all indexed (by col-stats-index)
      //       files and all outstanding base-files, and make sure that all base files not
      //       represented w/in the index are included in the output of this method
      final Set<String> notIndexedFiles = Arrays.stream(allFileStatus)
          .map(status -> status.getPath().getName())
          .collect(Collectors.toSet());
      notIndexedFiles.removeAll(indexedFiles);

      candidates.addAll(notIndexedFiles);
      return candidates;
    } catch (Throwable throwable) {
      // best effort: any failure falls back to "no pruning"
      LOG.warn("Read column stats for data skipping error", throwable);
      return null;
    }
  }
  /**
   * Logs a warning when data skipping is switched on while the metadata table is disabled.
   */
  private void validateConfig() {
    if (!dataSkippingEnabled || metadataConfig.enabled()) {
      // the configuration is consistent, nothing to report
      return;
    }
    LOG.warn("Data skipping requires Metadata Table to be enabled! "
        + "isMetadataTableEnabled = {}", metadataConfig.enabled());
  }
  /**
   * Returns all the relative partition paths.
   *
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/source/IncrementalInputSplits.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/source/IncrementalInputSplits.java
@@ -35,6 +35,7 @@ import org.apache.hudi.table.format.mor.MergeOnReadInputSplit;
 import org.apache.flink.configuration.Configuration;
 import org.apache.flink.core.fs.Path;
 import org.apache.flink.table.types.logical.RowType;
 import org.apache.hadoop.fs.FileStatus;
 import org.slf4j.Logger;
 import org.slf4j.LoggerFactory;
@@ -77,6 +78,7 @@ public class IncrementalInputSplits implements Serializable {
  private static final Logger LOG = LoggerFactory.getLogger(IncrementalInputSplits.class);
  private final Configuration conf;
  private final Path path;
  private final RowType rowType;
  private final long maxCompactionMemoryInBytes;
  // for partition pruning
  private final Set<String> requiredPartitions;
@@ -86,11 +88,13 @@ public class IncrementalInputSplits implements Serializable {
  private IncrementalInputSplits(
      Configuration conf,
      Path path,
      RowType rowType,
      long maxCompactionMemoryInBytes,
      @Nullable Set<String> requiredPartitions,
      boolean skipCompaction) {
    this.conf = conf;
    this.path = path;
    this.rowType = rowType;
    this.maxCompactionMemoryInBytes = maxCompactionMemoryInBytes;
    this.requiredPartitions = requiredPartitions;
    this.skipCompaction = skipCompaction;
@@ -167,7 +171,7 @@ public class IncrementalInputSplits implements Serializable {
    if (instantRange == null) {
      // reading from the earliest, scans the partitions and files directly.
-      FileIndex fileIndex = FileIndex.instance(new org.apache.hadoop.fs.Path(path.toUri()), conf);
+      FileIndex fileIndex = FileIndex.instance(new org.apache.hadoop.fs.Path(path.toUri()), conf, rowType);
      if (this.requiredPartitions != null) {
        // apply partition push down
        fileIndex.setPartitionPaths(this.requiredPartitions);
@@ -349,6 +353,7 @@ public class IncrementalInputSplits implements Serializable {
  public static class Builder {
    private Configuration conf;
    private Path path;
    private RowType rowType;
    private long maxCompactionMemoryInBytes;
    // for partition pruning
    private Set<String> requiredPartitions;
@@ -368,6 +373,11 @@ public class IncrementalInputSplits implements Serializable {
      return this;
    }
    /**
     * Sets the row type that {@code build()} hands over to the created {@link IncrementalInputSplits}.
     *
     * @param rowType the row type
     * @return this builder, so that calls can be chained
     */
    public Builder rowType(RowType rowType) {
      this.rowType = rowType;
      return this;
    }
    public Builder maxCompactionMemoryInBytes(long maxCompactionMemoryInBytes) {
      this.maxCompactionMemoryInBytes = maxCompactionMemoryInBytes;
      return this;
@@ -384,7 +394,8 @@ public class IncrementalInputSplits implements Serializable {
    }
    public IncrementalInputSplits build() {
-      return new IncrementalInputSplits(Objects.requireNonNull(this.conf), Objects.requireNonNull(this.path),
+      return new IncrementalInputSplits(
          Objects.requireNonNull(this.conf), Objects.requireNonNull(this.path), Objects.requireNonNull(this.rowType),
          this.maxCompactionMemoryInBytes, this.requiredPartitions, this.skipCompaction);
    }
  }
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/source/StreamReadMonitoringFunction.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/source/StreamReadMonitoringFunction.java
@@ -36,6 +36,7 @@ import org.apache.flink.runtime.state.FunctionSnapshotContext;
 import org.apache.flink.streaming.api.checkpoint.CheckpointedFunction;
 import org.apache.flink.streaming.api.functions.source.RichSourceFunction;
 import org.apache.flink.streaming.api.functions.source.SourceFunction;
 import org.apache.flink.table.types.logical.RowType;
 import org.slf4j.Logger;
 import org.slf4j.LoggerFactory;
@@ -99,6 +100,7 @@ public class StreamReadMonitoringFunction
  public StreamReadMonitoringFunction(
      Configuration conf,
      Path path,
      RowType rowType,
      long maxCompactionMemoryInBytes,
      @Nullable Set<String> requiredPartitionPaths) {
    this.conf = conf;
@@ -107,6 +109,7 @@ public class StreamReadMonitoringFunction
    this.incrementalInputSplits = IncrementalInputSplits.builder()
        .conf(conf)
        .path(path)
        .rowType(rowType)
        .maxCompactionMemoryInBytes(maxCompactionMemoryInBytes)
        .requiredPartitions(requiredPartitionPaths)
        .skipCompaction(conf.getBoolean(FlinkOptions.READ_STREAMING_SKIP_COMPACT))
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/source/stats/ColumnStatsIndices.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/source/stats/ColumnStatsIndices.java
@@ -0,0 +1,377 @@
 /*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 package org.apache.hudi.source.stats;
 import org.apache.hudi.avro.model.HoodieMetadataRecord;
 import org.apache.hudi.client.common.HoodieFlinkEngineContext;
 import org.apache.hudi.common.config.HoodieMetadataConfig;
 import org.apache.hudi.common.data.HoodieData;
 import org.apache.hudi.common.model.HoodieRecord;
 import org.apache.hudi.common.table.view.FileSystemViewStorageConfig;
 import org.apache.hudi.common.util.ValidationUtils;
 import org.apache.hudi.common.util.collection.Pair;
 import org.apache.hudi.common.util.hash.ColumnIndexID;
 import org.apache.hudi.exception.HoodieException;
 import org.apache.hudi.metadata.HoodieMetadataPayload;
 import org.apache.hudi.metadata.HoodieTableMetadata;
 import org.apache.hudi.metadata.HoodieTableMetadataUtil;
 import org.apache.hudi.util.AvroSchemaConverter;
 import org.apache.hudi.util.AvroToRowDataConverters;
 import org.apache.hudi.util.RowDataProjection;
 import org.apache.avro.generic.GenericRecord;
 import org.apache.flink.table.data.GenericRowData;
 import org.apache.flink.table.data.RowData;
 import org.apache.flink.table.data.StringData;
 import org.apache.flink.table.types.DataType;
 import org.apache.flink.table.types.logical.LogicalType;
 import org.apache.flink.table.types.logical.RowType;
 import org.apache.flink.table.types.logical.TimeType;
 import org.apache.flink.table.types.logical.TimestampType;
 import java.io.IOException;
 import java.util.Arrays;
 import java.util.List;
 import java.util.Map;
 import java.util.Set;
 import java.util.SortedMap;
 import java.util.TreeMap;
 import java.util.TreeSet;
 import java.util.stream.Collectors;
 import java.util.stream.Stream;
 import static org.apache.hudi.common.util.ValidationUtils.checkState;
 /**
 * Utilities for abstracting away heavy-lifting of interactions with Metadata Table's Column Stats Index,
 * providing convenient interfaces to read it, transpose, etc.
 */
 public class ColumnStatsIndices {
  private static final DataType METADATA_DATA_TYPE = getMetadataDataType();
  private static final DataType COL_STATS_DATA_TYPE = getColStatsDataType();
  private static final int[] COL_STATS_TARGET_POS = getColStatsTargetPos();
  // the column schema:
  // |- file_name: string
  // |- min_val: row
  // |- max_val: row
  // |- null_cnt: long
  // |- val_cnt: long
  // |- column_name: string
  private static final int ORD_FILE_NAME = 0;
  private static final int ORD_MIN_VAL = 1;
  private static final int ORD_MAX_VAL = 2;
  private static final int ORD_NULL_CNT = 3;
  private static final int ORD_VAL_CNT = 4;
  private static final int ORD_COL_NAME = 5;
  private ColumnStatsIndices() {
    // private on purpose: the members visible in this class are all static, no instance is needed
  }
  /**
   * Reads the Column Stats Index records of the given columns from the Metadata Table
   * and projects the nested column stats field of each record into a flat row.
   *
   * @param basePath       base path of the table
   * @param metadataConfig the metadata table config
   * @param targetColumns  the columns to fetch the statistics for, validated to be non-empty
   * @return the projected column stats rows
   */
  public static List<RowData> readColumnStatsIndex(String basePath, HoodieMetadataConfig metadataConfig, String[] targetColumns) {
    // NOTE: Only the Column Stats Index records pertaining to the requested columns are fetched,
    //       which considerably trims down the amount of data read. The column list is therefore
    //       validated up front to be non-empty.
    ValidationUtils.checkArgument(targetColumns.length > 0,
        "Column stats is only valid when push down filters have referenced columns");
    return projectNestedColStatsColumns(readColumnStatsIndexByColumns(basePath, targetColumns, metadataConfig));
  }
  /**
   * Extracts the nested column stats field out of every metadata row and projects it
   * onto the positions given by {@code COL_STATS_TARGET_POS}.
   *
   * @param rows the metadata rows
   * @return the projected column stats rows
   */
  private static List<RowData> projectNestedColStatsColumns(List<RowData> rows) {
    final int colStatsPos =
        HoodieMetadataRecord.SCHEMA$.getField(HoodieMetadataPayload.SCHEMA_FIELD_ID_COLUMN_STATS).pos();
    final RowType colStatsRowType = (RowType) COL_STATS_DATA_TYPE.getLogicalType();
    final RowDataProjection projection = RowDataProjection.instanceV2(colStatsRowType, COL_STATS_TARGET_POS);
    // NOTE(review): 9 is passed as the field count of the nested row, presumably the number
    //               of fields of the column stats record; confirm against the metadata schema
    return rows.stream().parallel()
        .map(metadataRow -> projection.project(metadataRow.getRow(colStatsPos, 9)))
        .collect(Collectors.toList());
  }
  /**
   * Transposes the raw table format of the Column Stats Index, where each row/record
   * corresponds to an individual (column, file) pair, into a table format where each row
   * corresponds to a single file with the statistics of the individual columns collated
   * w/in such row.
   *
   * <p>Metadata Table Column Stats Index format:
   *
   * <pre>
   *  +---------------------------+------------+------------+------------+-------------+
   *  |        fileName           | columnName |  minValue  |  maxValue  |  num_nulls  |
   *  +---------------------------+------------+------------+------------+-------------+
   *  | one_base_file.parquet     |          A |          1 |         10 |           0 |
   *  | another_base_file.parquet |          A |        -10 |          0 |           5 |
   *  +---------------------------+------------+------------+------------+-------------+
   * </pre>
   *
   * <p>Returned table format (the value count sits right after the file name, followed by
   * a min/max/null-count triple per column):
   *
   * <pre>
   *  +---------------------------+------------+------------+------------+-------------+
   *  |          file             | valueCount | A_minValue | A_maxValue | A_nullCount |
   *  +---------------------------+------------+------------+------------+-------------+
   *  | one_base_file.parquet     |        ... |          1 |         10 |           0 |
   *  | another_base_file.parquet |        ... |        -10 |          0 |           5 |
   *  +---------------------------+------------+------------+------------+-------------+
   * </pre>
   *
   * <p>NOTE: Column Stats Index might potentially contain statistics for many columns (if not all), while
   * query at hand might only be referencing a handful of those. As such, only the records of the
   * columns that are both queried and indexed are transposed.
   *
   * @param colStats     RowData list bearing raw Column Stats Index table
   * @param queryColumns target columns to be included into the final table
   * @param tableSchema  schema of the source data table
   * @return pair of the reshaped table according to the format outlined above and the sorted
   *         names of the columns that made it into that table
   */
  public static Pair<List<RowData>, String[]> transposeColumnStatsIndex(List<RowData> colStats, String[] queryColumns, RowType tableSchema) {
    final Map<String, LogicalType> fieldTypes = tableSchema.getFields().stream()
        .collect(Collectors.toMap(RowType.RowField::getName, RowType.RowField::getType));

    // NOTE: We have to collect list of indexed columns to make sure we properly align the rows
    //       w/in the transposed dataset: since some files might not have all the columns indexed
    //       either due to the Column Stats Index config changes, schema evolution, etc. we have
    //       to make sure that all the rows w/in transposed data-frame are properly padded (with null
    //       values) for such file-column combinations
    final Set<String> indexedColumns = colStats.stream()
        .map(statsRow -> statsRow.getString(ORD_COL_NAME).toString())
        .collect(Collectors.toSet());

    // NOTE: We're sorting the columns to make sure final index schema matches layout
    //       of the transposed table
    final TreeSet<String> sortedTargetColumns = Arrays.stream(queryColumns).sorted()
        .filter(indexedColumns::contains)
        .collect(Collectors.toCollection(TreeSet::new));

    final Map<StringData, List<RowData>> fileNameToRows = colStats.stream().parallel()
        .filter(statsRow -> sortedTargetColumns.contains(statsRow.getString(ORD_COL_NAME).toString()))
        .map(statsRow -> {
          if (statsRow.isNullAt(ORD_MIN_VAL) && statsRow.isNullAt(ORD_MAX_VAL)) {
            // Corresponding row could be null in either of the 2 cases
            //    - Column contains only null values (in that case both min/max have to be nulls)
            //    - This is a stubbed Column Stats record (used as a tombstone)
            return statsRow;
          }
          final String columnName = statsRow.getString(ORD_COL_NAME).toString();
          return unpackMinMaxVal(statsRow, fieldTypes.get(columnName));
        })
        .collect(Collectors.groupingBy(statsRow -> statsRow.getString(ORD_FILE_NAME)));

    final List<RowData> foldedRows = foldRowsByFiles(sortedTargetColumns, fileNameToRows);
    final String[] transposedColumns = sortedTargetColumns.toArray(new String[0]);
    return Pair.of(foldedRows, transposedColumns);
  }
  /**
   * Folds the (column, file) rows of every file into one row per file, laid out as:
   * file name, value count, then a (min, max, null count) triple for each target column
   * in sorted column order.
   *
   * @param sortedTargetColumns the sorted columns that make up the transposed table
   * @param fileNameToRows      the column stats rows grouped by file name
   * @return one folded row per file
   */
  private static List<RowData> foldRowsByFiles(
      TreeSet<String> sortedTargetColumns,
      Map<StringData, List<RowData>> fileNameToRows) {
    return fileNameToRows.values().stream().parallel().map(fileRows -> {
      // The group is always non-empty (otherwise it would not have been created by the grouping)
      final RowData head = fileRows.get(0);
      final StringData fileName = head.getString(ORD_FILE_NAME);
      final long valueCount = head.getLong(ORD_VAL_CNT);

      // To properly align individual rows (corresponding to a file) w/in the transposed projection, we need
      // to align existing column-stats for individual file with the list of expected ones for the
      // whole transposed projection (a superset of all files)
      final Map<String, RowData> rowsByColumn = fileRows.stream()
          .collect(Collectors.toMap(statsRow -> statsRow.getString(ORD_COL_NAME).toString(), statsRow -> statsRow));
      final SortedMap<String, RowData> alignedRows = new TreeMap<>();
      for (String column : sortedTargetColumns) {
        // a column without stats for this file is padded with null
        alignedRows.put(column, rowsByColumn.get(column));
      }

      final GenericRowData foldedRow = new GenericRowData(2 + 3 * alignedRows.size());
      foldedRow.setField(0, fileName);
      foldedRow.setField(1, valueCount);

      int pos = 2;
      for (RowData statsRow : alignedRows.values()) {
        final Tuple3 stats;
        if (statsRow != null) {
          GenericRowData genericRow = (GenericRowData) statsRow;
          stats = Tuple3.of(
              genericRow.getField(ORD_MIN_VAL), genericRow.getField(ORD_MAX_VAL), genericRow.getField(ORD_NULL_CNT));
        } else {
          // NOTE: Since we're assuming missing column to essentially contain exclusively
          //       null values, we set null-count to be equal to value-count (this behavior is
          //       consistent with reading non-existent columns from Parquet)
          stats = Tuple3.of(null, null, valueCount);
        }
        foldedRow.setField(pos, stats.f0);
        foldedRow.setField(pos + 1, stats.f1);
        foldedRow.setField(pos + 2, stats.f2);
        pos += 3;
      }
      return foldedRow;
    }).collect(Collectors.toList());
  }
  /**
   * Builds a copy of the given column stats row in which the nested min/max value rows
   * are replaced by the unpacked values.
   *
   * @param row     the column stats row, its min and max value rows are checked to be non-null
   * @param colType the logical type of the column the stats belong to
   * @return the row with unpacked min/max values
   */
  private static RowData unpackMinMaxVal(
      RowData row,
      LogicalType colType) {
    final RowData minStruct = row.getRow(ORD_MIN_VAL, 1);
    final RowData maxStruct = row.getRow(ORD_MAX_VAL, 1);

    checkState(minStruct != null && maxStruct != null,
        "Invalid Column Stats record: either both min/max have to be null, or both have to be non-null");

    final Object unpackedMin = tryUnpackNonNullVal(minStruct, colType);
    final Object unpackedMax = tryUnpackNonNullVal(maxStruct, colType);

    // the column schema:
    // |- file_name: string
    // |- min_val: row
    // |- max_val: row
    // |- null_cnt: long
    // |- val_cnt: long
    // |- column_name: string
    final GenericRowData result = new GenericRowData(row.getArity());
    result.setField(ORD_FILE_NAME, row.getString(ORD_FILE_NAME));
    result.setField(ORD_MIN_VAL, unpackedMin);
    result.setField(ORD_MAX_VAL, unpackedMax);
    result.setField(ORD_NULL_CNT, row.getLong(ORD_NULL_CNT));
    result.setField(ORD_VAL_CNT, row.getLong(ORD_VAL_CNT));
    result.setField(ORD_COL_NAME, row.getString(ORD_COL_NAME));
    return result;
  }
  /**
   * Unpacks the first non-null field of the given row.
   *
   * @param rowData the row to scan, field by field
   * @param colType the logical type used for unpacking the field value
   * @return the unpacked value of the first non-null field, or {@code null} if all fields are null
   */
  private static Object tryUnpackNonNullVal(RowData rowData, LogicalType colType) {
    for (int pos = 0; pos < rowData.getArity(); pos++) {
      // row data converted from avro is definitely generic.
      final Object fieldVal = ((GenericRowData) rowData).getField(pos);
      if (fieldVal == null) {
        continue;
      }
      return doUnpack(fieldVal, colType);
    }
    return null;
  }
  /**
   * Converts a raw value through the converter created for the given logical type.
   * For TIME and TIMESTAMP (both without time zone) values the time unit is fixed first.
   *
   * @param rawVal      the raw value
   * @param logicalType the logical type of the value
   * @return the converted value
   */
  private static Object doUnpack(Object rawVal, LogicalType logicalType) {
    // fix time unit
    final Object normalized;
    switch (logicalType.getTypeRoot()) {
      case TIME_WITHOUT_TIME_ZONE:
        normalized = rescaleByPrecision(rawVal, ((TimeType) logicalType).getPrecision());
        break;
      case TIMESTAMP_WITHOUT_TIME_ZONE:
        normalized = rescaleByPrecision(rawVal, ((TimestampType) logicalType).getPrecision());
        break;
      default:
        // no operation
        normalized = rawVal;
    }
    return AvroToRowDataConverters.createConverter(logicalType).convert(normalized);
  }

  /**
   * Rescales a raw time value for precision 3 or 9 and returns it untouched for any other precision.
   */
  private static Object rescaleByPrecision(Object rawVal, int precision) {
    if (precision == 3) {
      // the precision in HoodieMetadata is 6
      return ((Long) rawVal) / 1000;
    }
    if (precision == 9) {
      return ((Long) rawVal) * 1000;
    }
    return rawVal;
  }
  /**
   * Reads the Metadata Table's Column Stats Index (CSI) into a list of Flink {@link RowData} by
   * fetching the records by key-prefixes (the encoded column names) and deserializing each
   * fetched record into a row.
   *
   * @param basePath       the base path handed to the metadata table
   * @param targetColumns  the names of the columns whose stats should be fetched
   * @param metadataConfig the metadata config used to create the metadata table reader
   * @return one row per fetched column stats record
   * @throws HoodieException if the insert value of a metadata payload can not be read;
   *                         the triggering {@link IOException} is attached as the cause
   */
  private static List<RowData> readColumnStatsIndexByColumns(
      String basePath,
      String[] targetColumns,
      HoodieMetadataConfig metadataConfig) {
    HoodieTableMetadata metadataTable = HoodieTableMetadata.create(
        HoodieFlinkEngineContext.DEFAULT,
        metadataConfig, basePath,
        FileSystemViewStorageConfig.SPILLABLE_DIR.defaultValue());
    // TODO encoding should be done internally w/in HoodieBackedTableMetadata
    List<String> encodedTargetColumnNames = Arrays.stream(targetColumns)
        .map(colName -> new ColumnIndexID(colName).asBase64EncodedString()).collect(Collectors.toList());
    HoodieData<HoodieRecord<HoodieMetadataPayload>> records =
        metadataTable.getRecordsByKeyPrefixes(encodedTargetColumnNames, HoodieTableMetadataUtil.PARTITION_NAME_COLUMN_STATS);
    org.apache.hudi.util.AvroToRowDataConverters.AvroToRowDataConverter converter =
        AvroToRowDataConverters.createRowConverter((RowType) METADATA_DATA_TYPE.getLogicalType());
    return records.collectAsList().stream().parallel().map(record -> {
          // schema and props are ignored for generating metadata record from the payload
          // instead, the underlying file system, or bloom filter, or columns stats metadata (part of payload) are directly used
          GenericRecord genericRecord;
          try {
            genericRecord = (GenericRecord) record.getData().getInsertValue(null, null).orElse(null);
          } catch (IOException e) {
            // keep the original failure as the cause so the root problem stays diagnosable
            throw new HoodieException("Exception while getting insert value from metadata payload", e);
          }
          return (RowData) converter.convert(genericRecord);
        }
    ).collect(Collectors.toList());
  }
  // -------------------------------------------------------------------------
  //  Utilities
  // -------------------------------------------------------------------------
  /**
   * Minimal holder of three untyped values, exposed through the public fields
   * {@code f0}, {@code f1} and {@code f2}.
   */
  private static class Tuple3 {
    public Object f0;
    public Object f1;
    public Object f2;

    /**
     * Creates a tuple holding the given three values in order.
     */
    public static Tuple3 of(Object f0, Object f1, Object f2) {
      return new Tuple3(f0, f1, f2);
    }

    // instances are only created through the static factory
    private Tuple3(Object first, Object second, Object third) {
      f0 = first;
      f1 = second;
      f2 = third;
    }
  }
  /**
   * Converts the Avro schema of {@code HoodieMetadataRecord} into a Flink {@link DataType}.
   */
  private static DataType getMetadataDataType() {
    final DataType metadataRecordType = AvroSchemaConverter.convertToDataType(HoodieMetadataRecord.SCHEMA$);
    return metadataRecordType;
  }
  /**
   * Returns the data type of the column stats field nested in the metadata record type,
   * located through the position of that field in the Avro schema.
   */
  private static DataType getColStatsDataType() {
    final String colStatsField = HoodieMetadataPayload.SCHEMA_FIELD_ID_COLUMN_STATS;
    final int colStatsPos = HoodieMetadataRecord.SCHEMA$.getField(colStatsField).pos();
    final List<DataType> metadataFieldTypes = METADATA_DATA_TYPE.getChildren();
    return metadataFieldTypes.get(colStatsPos);
  }
  /**
   * Resolves the positions of the target fields inside the column stats row type.
   *
   * <p>The returned positions follow this column schema order:
   * <pre>
   * |- file_name: string
   * |- min_val: row
   * |- max_val: row
   * |- null_cnt: long
   * |- val_cnt: long
   * |- column_name: string
   * </pre>
   */
  private static int[] getColStatsTargetPos() {
    RowType colStatsRowType = (RowType) COL_STATS_DATA_TYPE.getLogicalType();
    final String[] targetFields = {
        HoodieMetadataPayload.COLUMN_STATS_FIELD_FILE_NAME,
        HoodieMetadataPayload.COLUMN_STATS_FIELD_MIN_VALUE,
        HoodieMetadataPayload.COLUMN_STATS_FIELD_MAX_VALUE,
        HoodieMetadataPayload.COLUMN_STATS_FIELD_NULL_COUNT,
        HoodieMetadataPayload.COLUMN_STATS_FIELD_VALUE_COUNT,
        HoodieMetadataPayload.COLUMN_STATS_FIELD_COLUMN_NAME
    };
    final int[] positions = new int[targetFields.length];
    for (int i = 0; i < targetFields.length; i++) {
      positions[i] = colStatsRowType.getFieldIndex(targetFields[i]);
    }
    return positions;
  }
 }
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/source/stats/ExpressionEvaluator.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/source/stats/ExpressionEvaluator.java
@@ -0,0 +1,552 @@
 /*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 package org.apache.hudi.source.stats;
 import org.apache.hudi.common.util.ValidationUtils;
 import org.apache.hudi.util.ExpressionUtils;
 import org.apache.flink.table.data.RowData;
 import org.apache.flink.table.expressions.CallExpression;
 import org.apache.flink.table.expressions.Expression;
 import org.apache.flink.table.expressions.FieldReferenceExpression;
 import org.apache.flink.table.expressions.ResolvedExpression;
 import org.apache.flink.table.expressions.ValueLiteralExpression;
 import org.apache.flink.table.functions.BuiltInFunctionDefinitions;
 import org.apache.flink.table.functions.FunctionDefinition;
 import org.apache.flink.table.types.logical.DecimalType;
 import org.apache.flink.table.types.logical.LogicalType;
 import org.apache.flink.table.types.logical.RowType;
 import javax.validation.constraints.NotNull;
 import java.math.BigDecimal;
 import java.util.ArrayList;
 import java.util.Arrays;
 import java.util.List;
 /**
 * Tool to evaluate the {@link org.apache.flink.table.expressions.ResolvedExpression}s.
 */
 public class ExpressionEvaluator {
  private static final int IN_PREDICATE_LIMIT = 200;
  /**
   * Decides whether an index row passes all the given data filters.
   *
   * <p>Each filter is bound to the index row as a call expression and evaluated in order;
   * evaluation stops at the first filter that rejects the row.
   *
   * @param filters     The pushed down data filters
   * @param indexRow    The index row
   * @param queryFields The query fields referenced by the filters
   * @return true if the index row should be considered as a candidate
   */
  public static boolean filterExprs(List<ResolvedExpression> filters, RowData indexRow, RowType.RowField[] queryFields) {
    return filters.stream()
        .allMatch(filter -> Evaluator.bindCall((CallExpression) filter, indexRow, queryFields).eval());
  }
  /**
   * Base class of the predicates that decide whether literal values match the column stats.
   * Evaluators can be nested (see the NOT / AND / OR handling in {@link #bindCall}).
   */
  public abstract static class Evaluator {
    // the constant literal value
    protected Object val;
    // column stats
    protected Object minVal;
    protected Object maxVal;
    protected long nullCnt = 0;
    // referenced field type
    protected LogicalType type;

    /**
     * Creates the evaluator for the given call expression and binds it.
     *
     * <p>Binding happens in three steps:
     * 1. pick the evaluator that matches the function definition;
     * 2. bind the field reference;
     * 3. bind the column stats.
     *
     * <p>The expression is treated as if the literal were always on the right side: when the
     * field reference is the second operand, the mirrored comparison evaluator is chosen.
     *
     * @param call        the call expression to bind
     * @param indexRow    the index row holding the column stats
     * @param queryFields the query fields referenced by the filters
     * @return the bound evaluator
     * @throws AssertionError if the function definition is not one of the handled ones
     */
    public static Evaluator bindCall(CallExpression call, RowData indexRow, RowType.RowField[] queryFields) {
      final FunctionDefinition function = call.getFunctionDefinition();
      final List<Expression> operands = call.getChildren();
      final boolean normalized = operands.get(0) instanceof FieldReferenceExpression;
      // composite predicates: bind the operands recursively
      if (BuiltInFunctionDefinitions.NOT.equals(function)) {
        Not negation = Not.getInstance();
        Evaluator inner = bindCall((CallExpression) operands.get(0), indexRow, queryFields);
        return negation.bindEvaluator(inner);
      }
      if (BuiltInFunctionDefinitions.AND.equals(function)) {
        And conjunction = And.getInstance();
        Evaluator left = bindCall((CallExpression) operands.get(0), indexRow, queryFields);
        Evaluator right = bindCall((CallExpression) operands.get(1), indexRow, queryFields);
        return conjunction.bindEvaluator(left, right);
      }
      if (BuiltInFunctionDefinitions.OR.equals(function)) {
        Or disjunction = Or.getInstance();
        Evaluator left = bindCall((CallExpression) operands.get(0), indexRow, queryFields);
        Evaluator right = bindCall((CallExpression) operands.get(1), indexRow, queryFields);
        return disjunction.bindEvaluator(left, right);
      }
      // IN: the first operand is the field, the remaining operands are the literals
      if (BuiltInFunctionDefinitions.IN.equals(function)) {
        ValidationUtils.checkState(normalized, "The IN expression expects to be normalized");
        In inPredicate = In.getInstance();
        FieldReferenceExpression fieldRef = (FieldReferenceExpression) operands.get(0);
        inPredicate.bindFieldReference(fieldRef);
        inPredicate.bindVals(getInLiteralVals(operands));
        return inPredicate.bindColStats(indexRow, queryFields, fieldRef);
      }
      // unary operators
      if (BuiltInFunctionDefinitions.IS_NULL.equals(function)) {
        FieldReferenceExpression fieldRef = (FieldReferenceExpression) operands.get(0);
        return IsNull.getInstance()
            .bindFieldReference(fieldRef)
            .bindColStats(indexRow, queryFields, fieldRef);
      }
      if (BuiltInFunctionDefinitions.IS_NOT_NULL.equals(function)) {
        FieldReferenceExpression fieldRef = (FieldReferenceExpression) operands.get(0);
        return IsNotNull.getInstance()
            .bindFieldReference(fieldRef)
            .bindColStats(indexRow, queryFields, fieldRef);
      }
      // binary operators: mirror the comparison when the literal is on the left side
      final Evaluator comparison;
      if (BuiltInFunctionDefinitions.EQUALS.equals(function)) {
        comparison = EqualTo.getInstance();
      } else if (BuiltInFunctionDefinitions.NOT_EQUALS.equals(function)) {
        comparison = NotEqualTo.getInstance();
      } else if (BuiltInFunctionDefinitions.LESS_THAN.equals(function)) {
        comparison = normalized ? LessThan.getInstance() : GreaterThan.getInstance();
      } else if (BuiltInFunctionDefinitions.GREATER_THAN.equals(function)) {
        comparison = normalized ? GreaterThan.getInstance() : LessThan.getInstance();
      } else if (BuiltInFunctionDefinitions.LESS_THAN_OR_EQUAL.equals(function)) {
        comparison = normalized ? LessThanOrEqual.getInstance() : GreaterThanOrEqual.getInstance();
      } else if (BuiltInFunctionDefinitions.GREATER_THAN_OR_EQUAL.equals(function)) {
        comparison = normalized ? GreaterThanOrEqual.getInstance() : LessThanOrEqual.getInstance();
      } else {
        throw new AssertionError("Unexpected function definition " + function);
      }
      final int fieldIdx = normalized ? 0 : 1;
      FieldReferenceExpression fieldRef = (FieldReferenceExpression) operands.get(fieldIdx);
      ValueLiteralExpression literal = (ValueLiteralExpression) operands.get(1 - fieldIdx);
      comparison
          .bindFieldReference(fieldRef)
          .bindVal(literal)
          .bindColStats(indexRow, queryFields, fieldRef);
      return comparison;
    }

    /**
     * Binds the min value, max value and null count of the referenced column.
     *
     * <p>The stats of the query field at index {@code i} are read from three consecutive
     * positions of the index row starting at {@code 2 + i * 3}: min value, max value, null count.
     * If several query fields carry the referenced name, the last one wins.
     *
     * @param indexRow    the index row holding the column stats
     * @param queryFields the query fields referenced by the filters
     * @param expr        the field reference whose stats are bound
     * @return this evaluator
     */
    public Evaluator bindColStats(
        RowData indexRow,
        RowType.RowField[] queryFields,
        FieldReferenceExpression expr) {
      final String colName = expr.getName();
      int colPos = -1;
      for (int i = 0; i < queryFields.length; i++) {
        if (colName.equals(queryFields[i].getName())) {
          colPos = i;
        }
      }
      ValidationUtils.checkState(colPos != -1, "Can not find column " + colName);
      final int minPos = 2 + colPos * 3;
      final int maxPos = minPos + 1;
      final int nullCntPos = minPos + 2;
      final LogicalType colType = queryFields[colPos].getType();
      // read everything first so the fields stay untouched if a read fails
      final Object min = indexRow.isNullAt(minPos) ? null : getValAsJavaObj(indexRow, minPos, colType);
      final Object max = indexRow.isNullAt(maxPos) ? null : getValAsJavaObj(indexRow, maxPos, colType);
      final long nulls = indexRow.getLong(nullCntPos);
      this.minVal = min;
      this.maxVal = max;
      this.nullCnt = nulls;
      return this;
    }

    /**
     * Binds the constant value extracted from the given literal expression.
     *
     * @return this evaluator
     */
    public Evaluator bindVal(ValueLiteralExpression vExpr) {
      final Object literalValue = ExpressionUtils.getValueFromLiteral(vExpr);
      this.val = literalValue;
      return this;
    }

    /**
     * Binds the logical type of the referenced field.
     *
     * @return this evaluator
     */
    public Evaluator bindFieldReference(FieldReferenceExpression expr) {
      final LogicalType fieldType = expr.getOutputDataType().getLogicalType();
      this.type = fieldType;
      return this;
    }

    /**
     * Evaluates the bound predicate against the bound column stats.
     */
    public abstract boolean eval();
  }
  /**
   * Evaluates the {@code =} predicate: the literal must lie within [minVal, maxVal].
   */
  public static class EqualTo extends Evaluator {
    public static EqualTo getInstance() {
      return new EqualTo();
    }

    @Override
    public boolean eval() {
      final boolean incomplete = this.minVal == null || this.maxVal == null || this.val == null;
      if (incomplete) {
        return false;
      }
      // candidate only when minVal <= val <= maxVal
      return compare(this.minVal, this.val, this.type) <= 0
          && compare(this.maxVal, this.val, this.type) >= 0;
    }
  }
  /**
   * Evaluates the {@code <>} predicate.
   */
  public static class NotEqualTo extends Evaluator {
    public static NotEqualTo getInstance() {
      return new NotEqualTo();
    }

    @Override
    public boolean eval() {
      // The bounds can not answer this: they are not necessarily actual min or max values,
      // so notEq(col, X) with bounds (X, Y) does not guarantee that X is a value in col.
      // Always keep the row as a candidate.
      return true;
    }
  }
  /**
   * Evaluates the {@code IS NULL} predicate: matches when the null count is positive.
   */
  public static class IsNull extends Evaluator {
    public static IsNull getInstance() {
      return new IsNull();
    }

    @Override
    public boolean eval() {
      final boolean hasNulls = this.nullCnt > 0;
      return hasNulls;
    }
  }
  /**
   * Evaluates the {@code IS NOT NULL} predicate: matches when a min value exists
   * or the null count is not positive.
   */
  public static class IsNotNull extends Evaluator {
    public static IsNotNull getInstance() {
      return new IsNotNull();
    }

    @Override
    public boolean eval() {
      // should consider FLOAT/DOUBLE & NAN
      if (this.minVal != null) {
        return true;
      }
      return this.nullCnt <= 0;
    }
  }
  /**
   * Evaluates the {@code <} predicate: matches when the min value is below the literal.
   */
  public static class LessThan extends Evaluator {
    public static LessThan getInstance() {
      return new LessThan();
    }

    @Override
    public boolean eval() {
      // without a lower bound there is nothing to match
      return this.minVal != null && compare(this.minVal, this.val, this.type) < 0;
    }
  }
  /**
   * Evaluates the {@code >} predicate: matches when the max value is above the literal.
   */
  public static class GreaterThan extends Evaluator {
    public static GreaterThan getInstance() {
      return new GreaterThan();
    }

    @Override
    public boolean eval() {
      // without an upper bound there is nothing to match
      return this.maxVal != null && compare(this.maxVal, this.val, this.type) > 0;
    }
  }
  /**
   * Evaluates the {@code <=} predicate: matches when the min value is not above the literal.
   */
  public static class LessThanOrEqual extends Evaluator {
    public static LessThanOrEqual getInstance() {
      return new LessThanOrEqual();
    }

    @Override
    public boolean eval() {
      // without a lower bound there is nothing to match
      return this.minVal != null && compare(this.minVal, this.val, this.type) <= 0;
    }
  }
  /**
   * Evaluates the {@code >=} predicate: matches when the max value is not below the literal.
   */
  public static class GreaterThanOrEqual extends Evaluator {
    public static GreaterThanOrEqual getInstance() {
      return new GreaterThanOrEqual();
    }

    @Override
    public boolean eval() {
      // without an upper bound there is nothing to match
      return this.maxVal != null && compare(this.maxVal, this.val, this.type) >= 0;
    }
  }
  /**
   * Evaluates the {@code IN} predicate: matches when at least one literal lies within
   * [minVal, maxVal].
   *
   * <p>Evaluation does not modify the bound literals, so {@link #eval()} can be invoked
   * repeatedly on the same instance.
   */
  public static class In extends Evaluator {
    public static In getInstance() {
      return new In();
    }

    private Object[] vals;

    @Override
    public boolean eval() {
      if (this.minVal == null) {
        return false; // values are all null and literalSet cannot contain null.
      }
      if (vals.length > IN_PREDICATE_LIMIT) {
        // skip evaluating the predicate if the number of values is too big
        return true;
      }
      if (this.maxVal == null) {
        // no upper bound to compare against, treated like EqualTo treats a missing bound
        return false;
      }
      // rows can only match if some literal is neither below the lower bound
      // nor above the upper bound
      return Arrays.stream(vals).anyMatch(v ->
          compare(this.minVal, v, this.type) <= 0 && compare(this.maxVal, v, this.type) >= 0);
    }

    /**
     * Binds the literal values of the IN list.
     */
    public void bindVals(Object... vals) {
      this.vals = vals;
    }
  }
  // component predicate
  /**
   * To evaluate NOT expr.
   *
   * <p>The wrapped evaluator answers "may the file contain rows that match the predicate",
   * which is derived from min/max/null-count stats. Negating that answer is not sound:
   * a file whose stats say it may contain matching rows usually also contains rows that
   * do not match (e.g. {@code NOT (col IS NULL)} on a file with both null and non-null
   * values). Because the stats can not rule the file out, the negation always keeps the
   * row as a candidate.
   */
  public static class Not extends Evaluator {
    public static Not getInstance() {
      return new Not();
    }

    // the negated evaluator, kept for the binding contract
    private Evaluator evaluator;

    @Override
    public boolean eval() {
      // "may match p" does not imply "can not match NOT p", so never prune here
      return true;
    }

    /**
     * Binds the evaluator to negate.
     *
     * @return this evaluator
     */
    public Evaluator bindEvaluator(Evaluator evaluator) {
      this.evaluator = evaluator;
      return this;
    }
  }
  /**
   * Evaluates the {@code AND} predicate: matches only when every bound operand matches.
   */
  public static class And extends Evaluator {
    public static And getInstance() {
      return new And();
    }

    private Evaluator[] evaluators;

    @Override
    public boolean eval() {
      // stops at the first operand that does not match
      return Arrays.stream(evaluators).allMatch(Evaluator::eval);
    }

    /**
     * Binds the operands of the conjunction.
     *
     * @return this evaluator
     */
    public Evaluator bindEvaluator(Evaluator... evaluators) {
      this.evaluators = evaluators;
      return this;
    }
  }
  /**
   * Evaluates the {@code OR} predicate: matches as soon as one bound operand matches.
   */
  public static class Or extends Evaluator {
    public static Or getInstance() {
      return new Or();
    }

    private Evaluator[] evaluators;

    @Override
    public boolean eval() {
      // stops at the first operand that matches
      return Arrays.stream(evaluators).anyMatch(Evaluator::eval);
    }

    /**
     * Binds the operands of the disjunction.
     *
     * @return this evaluator
     */
    public Evaluator bindEvaluator(Evaluator... evaluators) {
      this.evaluators = evaluators;
      return this;
    }
  }
  // -------------------------------------------------------------------------
  //  Utilities
  // -------------------------------------------------------------------------
  /**
   * Compares two non-null values of the given logical type.
   *
   * <p>Both values are cast to the Java class used for the type root (see the cases below)
   * and compared with the natural ordering of that class; binary values are compared
   * with {@code compareBytes}.
   *
   * @return a negative integer, zero, or a positive integer as {@code val1} is less than,
   *         equal to, or greater than {@code val2}
   * @throws UnsupportedOperationException if the type root is not handled
   */
  private static int compare(@NotNull Object val1, @NotNull Object val2, LogicalType logicalType) {
    switch (logicalType.getTypeRoot()) {
      case TIMESTAMP_WITHOUT_TIME_ZONE:
      case TIME_WITHOUT_TIME_ZONE:
      case DATE: {
        final Long left = (Long) val1;
        final Long right = (Long) val2;
        return left.compareTo(right);
      }
      case BOOLEAN: {
        final Boolean left = (Boolean) val1;
        final Boolean right = (Boolean) val2;
        return left.compareTo(right);
      }
      case TINYINT:
      case SMALLINT:
      case INTEGER: {
        final Integer left = (Integer) val1;
        final Integer right = (Integer) val2;
        return left.compareTo(right);
      }
      case FLOAT: {
        final Float left = (Float) val1;
        final Float right = (Float) val2;
        return left.compareTo(right);
      }
      case DOUBLE: {
        final Double left = (Double) val1;
        final Double right = (Double) val2;
        return left.compareTo(right);
      }
      case BINARY:
      case VARBINARY: {
        final byte[] left = (byte[]) val1;
        final byte[] right = (byte[]) val2;
        return compareBytes(left, right);
      }
      case CHAR:
      case VARCHAR: {
        final String left = (String) val1;
        final String right = (String) val2;
        return left.compareTo(right);
      }
      case DECIMAL: {
        final BigDecimal left = (BigDecimal) val1;
        final BigDecimal right = (BigDecimal) val2;
        return left.compareTo(right);
      }
      default:
        throw new UnsupportedOperationException("Unsupported type: " + logicalType);
    }
  }
  /**
   * Compares two byte arrays lexicographically, treating each byte as a signed value.
   *
   * @return the difference of the first pair of differing bytes, or the difference of the
   *         array lengths when one array is a prefix of the other
   */
  private static int compareBytes(byte[] v1, byte[] v2) {
    final int common = Math.min(v1.length, v2.length);
    for (int i = 0; i < common; i++) {
      final int diff = v1[i] - v2[i];
      if (diff != 0) {
        return diff;
      }
    }
    // equal up to the shorter length: the shorter array sorts first
    return v1.length - v2.length;
  }
  /**
   * Extracts the literal values of an IN expression.
   *
   * <p>The first child expression is skipped (it is not a literal of the IN list);
   * every remaining child is read as a value literal.
   */
  private static Object[] getInLiteralVals(List<Expression> childExprs) {
    return childExprs.stream()
        .skip(1)
        .map(literal -> ExpressionUtils.getValueFromLiteral((ValueLiteralExpression) literal))
        .toArray();
  }
  /**
   * Reads the field at position {@code pos} of row {@code indexRow} as a Java object,
   * using the accessor that belongs to the type root of {@code colType}.
   *
   * @throws UnsupportedOperationException if the type root is not handled
   */
  private static Object getValAsJavaObj(RowData indexRow, int pos, LogicalType colType) {
    switch (colType.getTypeRoot()) {
      case BOOLEAN:
        return indexRow.getBoolean(pos);
      // NOTE: All integral types of size less than Int are encoded as Ints in MT
      case TINYINT:
      case SMALLINT:
      case INTEGER:
        return indexRow.getInt(pos);
      // NOTE: Since we can't rely on Avro's "date", and "timestamp-micros" logical-types, we're
      //       manually encoding corresponding values as int and long w/in the Column Stats Index and
      //       here we have to decode those back into corresponding logical representation.
      case DATE:
      case TIME_WITHOUT_TIME_ZONE:
      case TIMESTAMP_WITHOUT_TIME_ZONE:
        return indexRow.getLong(pos);
      case FLOAT:
        return indexRow.getFloat(pos);
      case DOUBLE:
        return indexRow.getDouble(pos);
      case DECIMAL:
        final DecimalType decimal = (DecimalType) colType;
        final int precision = decimal.getPrecision();
        final int scale = decimal.getScale();
        return indexRow.getDecimal(pos, precision, scale).toBigDecimal();
      case CHAR:
      case VARCHAR:
        return indexRow.getString(pos).toString();
      case BINARY:
      case VARBINARY:
        return indexRow.getBinary(pos);
      default:
        throw new UnsupportedOperationException("Unsupported type: " + colType);
    }
  }
 }
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/table/HoodieTableSink.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/table/HoodieTableSink.java
@@ -67,7 +67,7 @@ public class HoodieTableSink implements DynamicTableSink, SupportsPartitioning,
          .getCheckpointConfig().getCheckpointTimeout();
      conf.setLong(FlinkOptions.WRITE_COMMIT_ACK_TIMEOUT, ckpTimeout);
-      RowType rowType = (RowType) schema.toSourceRowDataType().notNull().getLogicalType();
+      RowType rowType = (RowType) schema.toSinkRowDataType().notNull().getLogicalType();
      // bulk_insert mode
      final String writeOperation = this.conf.get(FlinkOptions.OPERATION);
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/table/HoodieTableSource.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/table/HoodieTableSource.java
@@ -20,6 +20,7 @@ package org.apache.hudi.table;
 import org.apache.hudi.avro.HoodieAvroUtils;
 import org.apache.hudi.common.model.BaseFile;
 import org.apache.hudi.common.model.HoodieBaseFile;
 import org.apache.hudi.common.model.HoodieCommitMetadata;
 import org.apache.hudi.common.model.HoodieLogFile;
 import org.apache.hudi.common.model.HoodieTableType;
@@ -34,7 +35,6 @@ import org.apache.hudi.configuration.FlinkOptions;
 import org.apache.hudi.configuration.HadoopConfigurations;
 import org.apache.hudi.configuration.OptionsResolver;
 import org.apache.hudi.exception.HoodieException;
 import org.apache.hudi.hadoop.HoodieROTablePathFilter;
 import org.apache.hudi.source.FileIndex;
 import org.apache.hudi.source.IncrementalInputSplits;
 import org.apache.hudi.source.StreamReadMonitoringFunction;
@@ -46,13 +46,12 @@ import org.apache.hudi.table.format.mor.MergeOnReadInputSplit;
 import org.apache.hudi.table.format.mor.MergeOnReadTableState;
 import org.apache.hudi.util.AvroSchemaConverter;
 import org.apache.hudi.util.ChangelogModes;
 import org.apache.hudi.util.ExpressionUtils;
 import org.apache.hudi.util.InputFormats;
 import org.apache.hudi.util.StreamerUtil;
 import org.apache.avro.Schema;
 import org.apache.flink.annotation.VisibleForTesting;
 import org.apache.flink.api.common.io.FileInputFormat;
 import org.apache.flink.api.common.io.FilePathFilter;
 import org.apache.flink.api.common.io.InputFormat;
 import org.apache.flink.api.common.typeinfo.TypeInformation;
 import org.apache.flink.configuration.Configuration;
@@ -73,7 +72,6 @@ import org.apache.flink.table.connector.source.abilities.SupportsLimitPushDown;
 import org.apache.flink.table.connector.source.abilities.SupportsPartitionPushDown;
 import org.apache.flink.table.connector.source.abilities.SupportsProjectionPushDown;
 import org.apache.flink.table.data.RowData;
 import org.apache.flink.table.expressions.Expression;
 import org.apache.flink.table.expressions.ResolvedExpression;
 import org.apache.flink.table.runtime.types.TypeInfoDataTypeConverter;
 import org.apache.flink.table.types.DataType;
@@ -117,6 +115,7 @@ public class HoodieTableSource implements
  private final long maxCompactionMemoryInBytes;
  private final ResolvedSchema schema;
  private final RowType tableRowType;
  private final Path path;
  private final List<String> partitionKeys;
  private final String defaultPartName;
@@ -125,7 +124,7 @@ public class HoodieTableSource implements
  private int[] requiredPos;
  private long limit;
-  private List<Expression> filters;
+  private List<ResolvedExpression> filters;
  private List<Map<String, String>> requiredPartitions;
@@ -147,21 +146,22 @@ public class HoodieTableSource implements
      @Nullable List<Map<String, String>> requiredPartitions,
      @Nullable int[] requiredPos,
      @Nullable Long limit,
-      @Nullable List<Expression> filters) {
+      @Nullable List<ResolvedExpression> filters) {
    this.schema = schema;
    this.tableRowType = (RowType) schema.toPhysicalRowDataType().notNull().getLogicalType();
    this.path = path;
    this.partitionKeys = partitionKeys;
    this.defaultPartName = defaultPartName;
    this.conf = conf;
    this.fileIndex = FileIndex.instance(this.path, this.conf);
    this.requiredPartitions = requiredPartitions;
    this.requiredPos = requiredPos == null
-        ? IntStream.range(0, schema.toPhysicalRowDataType().getChildren().size()).toArray()
+        ? IntStream.range(0, this.tableRowType.getFieldCount()).toArray()
        : requiredPos;
    this.limit = limit == null ? NO_LIMIT_CONSTANT : limit;
    this.filters = filters == null ? Collections.emptyList() : filters;
    this.hadoopConf = HadoopConfigurations.getHadoopConf(conf);
    this.metaClient = StreamerUtil.metaClientForReader(conf, hadoopConf);
    this.fileIndex = FileIndex.instance(this.path, this.conf, this.tableRowType);
    this.maxCompactionMemoryInBytes = StreamerUtil.getMaxCompactionMemoryInBytes(conf);
  }
@@ -181,12 +181,12 @@ public class HoodieTableSource implements
            (TypeInformation<RowData>) TypeInfoDataTypeConverter.fromDataTypeToTypeInfo(getProducedDataType());
        if (conf.getBoolean(FlinkOptions.READ_AS_STREAMING)) {
          StreamReadMonitoringFunction monitoringFunction = new StreamReadMonitoringFunction(
-              conf, FilePathUtils.toFlinkPath(path), maxCompactionMemoryInBytes, getRequiredPartitionPaths());
+              conf, FilePathUtils.toFlinkPath(path), tableRowType, maxCompactionMemoryInBytes, getRequiredPartitionPaths());
          InputFormat<RowData, ?> inputFormat = getInputFormat(true);
          OneInputStreamOperatorFactory<MergeOnReadInputSplit, RowData> factory = StreamReadOperator.factory((MergeOnReadInputFormat) inputFormat);
          SingleOutputStreamOperator<RowData> source = execEnv.addSource(monitoringFunction, getSourceOperatorName("split_monitor"))
              .setParallelism(1)
-              .keyBy(inputSplit -> inputSplit.getFileId())
+              .keyBy(MergeOnReadInputSplit::getFileId)
              .transform("split_reader", typeInfo, factory)
              .setParallelism(conf.getInteger(FlinkOptions.READ_TASKS));
          return new DataStreamSource<>(source);
@@ -219,7 +219,8 @@ public class HoodieTableSource implements
  @Override
  public Result applyFilters(List<ResolvedExpression> filters) {
-    this.filters = new ArrayList<>(filters);
+    this.filters = filters.stream().filter(ExpressionUtils::isSimpleCallExpression).collect(Collectors.toList());
    this.fileIndex.setFilters(this.filters);
    // refuse all the filters now
    return SupportsFilterPushDown.Result.of(Collections.emptyList(), new ArrayList<>(filters));
  }
@@ -262,13 +263,6 @@ public class HoodieTableSource implements
        .bridgedTo(RowData.class);
  }
  private List<Map<String, String>> getOrFetchPartitions() {
    if (requiredPartitions == null) {
      requiredPartitions = listPartitions().orElse(Collections.emptyList());
    }
    return requiredPartitions;
  }
  private String getSourceOperatorName(String operatorName) {
    String[] schemaFieldNames = this.schema.getColumnNames().toArray(new String[0]);
    List<String> fields = Arrays.stream(this.requiredPos)
@@ -366,7 +360,9 @@ public class HoodieTableSource implements
        return baseFileOnlyInputFormat();
      case FlinkOptions.QUERY_TYPE_INCREMENTAL:
        IncrementalInputSplits incrementalInputSplits = IncrementalInputSplits.builder()
-            .conf(conf).path(FilePathUtils.toFlinkPath(path))
+            .conf(conf)
            .path(FilePathUtils.toFlinkPath(path))
            .rowType(this.tableRowType)
            .maxCompactionMemoryInBytes(maxCompactionMemoryInBytes)
            .requiredPartitions(getRequiredPartitionPaths()).build();
        final IncrementalInputSplits.Result result = incrementalInputSplits.inputSplits(metaClient, hadoopConf);
@@ -439,11 +435,18 @@ public class HoodieTableSource implements
  }
  private InputFormat<RowData, ?> baseFileOnlyInputFormat() {
-    final Path[] paths = getReadPaths();
+    final FileStatus[] fileStatuses = getReadFiles();
-    if (paths.length == 0) {
+    if (fileStatuses.length == 0) {
      return InputFormats.EMPTY_INPUT_FORMAT;
    }
-    FileInputFormat<RowData> format = new CopyOnWriteInputFormat(
+
    HoodieTableFileSystemView fsView = new HoodieTableFileSystemView(metaClient,
        metaClient.getCommitsAndCompactionTimeline().filterCompletedInstants(), fileStatuses);
    Path[] paths = fsView.getLatestBaseFiles()
        .map(HoodieBaseFile::getFileStatus)
        .map(FileStatus::getPath).toArray(Path[]::new);
    return new CopyOnWriteInputFormat(
        FilePathUtils.toFlinkPaths(paths),
        this.schema.getColumnNames().toArray(new String[0]),
        this.schema.getColumnDataTypes().toArray(new DataType[0]),
@@ -453,12 +456,10 @@ public class HoodieTableSource implements
        getParquetConf(this.conf, this.hadoopConf),
        this.conf.getBoolean(FlinkOptions.UTC_TIMEZONE)
    );
    format.setFilesFilter(new LatestFileFilter(this.hadoopConf));
    return format;
  }
  private Schema inferSchemaFromDdl() {
-    Schema schema = AvroSchemaConverter.convertToSchema(this.schema.toPhysicalRowDataType().getLogicalType());
+    Schema schema = AvroSchemaConverter.convertToSchema(this.tableRowType);
    return HoodieAvroUtils.addMetadataFields(schema, conf.getBoolean(FlinkOptions.CHANGELOG_ENABLED));
  }
@@ -498,23 +499,13 @@ public class HoodieTableSource implements
   * Get the reader paths with partition path expanded.
   */
  @VisibleForTesting
-  public Path[] getReadPaths() {
+  public FileStatus[] getReadFiles() {
-    return partitionKeys.isEmpty()
+    Set<String> requiredPartitionPaths = getRequiredPartitionPaths();
-        ? new Path[] {path}
+    fileIndex.setPartitionPaths(requiredPartitionPaths);
-        : FilePathUtils.partitionPath2ReadPath(path, partitionKeys, getOrFetchPartitions(),
+    List<String> relPartitionPaths = fileIndex.getOrBuildPartitionPaths();
-        conf.getBoolean(FlinkOptions.HIVE_STYLE_PARTITIONING));
+    if (relPartitionPaths.size() == 0) {
-  }
+      return new FileStatus[0];
  private static class LatestFileFilter extends FilePathFilter {
    private final HoodieROTablePathFilter hoodieFilter;
    public LatestFileFilter(org.apache.hadoop.conf.Configuration hadoopConf) {
      this.hoodieFilter = new HoodieROTablePathFilter(hadoopConf);
    }
    @Override
    public boolean filterPath(org.apache.flink.core.fs.Path filePath) {
      return !this.hoodieFilter.accept(new Path(filePath.toUri()));
    }
    return fileIndex.getFilesInPartitions();
  }
 }
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/table/format/FilePathUtils.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/table/format/FilePathUtils.java
@@ -323,6 +323,10 @@ public class FilePathUtils {
  public static LinkedHashMap<String, String> validateAndReorderPartitions(
      Map<String, String> partitionKVs,
      List<String> partitionKeys) {
    if (partitionKeys.size() == 0) {
      // in case the partition fields are not in schema
      return new LinkedHashMap<>(partitionKVs);
    }
    LinkedHashMap<String, String> map = new LinkedHashMap<>();
    for (String k : partitionKeys) {
      if (!partitionKVs.containsKey(k)) {
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/AvroSchemaConverter.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/AvroSchemaConverter.java
@@ -39,6 +39,7 @@ import org.apache.flink.table.types.logical.TypeInformationRawType;
 import org.apache.flink.table.types.logical.utils.LogicalTypeChecks;
 import java.util.List;
 import java.util.stream.Collectors;
 /**
 * Converts an Avro schema into Flink's type information. It uses {@link org.apache.flink.api.java.typeutils.RowTypeInfo} for
@@ -96,9 +97,24 @@ public class AvroSchemaConverter {
          actualSchema = schema.getTypes().get(0);
          nullable = false;
        } else {
          List<Schema> nonNullTypes = schema.getTypes().stream()
              .filter(s -> s.getType() != Schema.Type.NULL)
              .collect(Collectors.toList());
          nullable = schema.getTypes().size() > nonNullTypes.size();
          // use Kryo for serialization
-          return new AtomicDataType(
+          DataType rawDataType = new AtomicDataType(
-              new TypeInformationRawType<>(false, Types.GENERIC(Object.class)));
+              new TypeInformationRawType<>(false, Types.GENERIC(Object.class)))
              .notNull();
          if (recordTypesOfSameNumFields(nonNullTypes)) {
            DataType converted = DataTypes.ROW(
                DataTypes.FIELD("wrapper", rawDataType))
                .notNull();
            return nullable ? converted.nullable() : converted;
          }
          // use Kryo for serialization
          return nullable ? rawDataType.nullable() : rawDataType;
        }
        DataType converted = convertToDataType(actualSchema);
        return nullable ? converted.nullable() : converted;
@@ -155,6 +171,20 @@ public class AvroSchemaConverter {
    }
  }
  /**
   * Returns true if all the types are RECORD type with same number of fields.
   */
  private static boolean recordTypesOfSameNumFields(List<Schema> types) {
    if (types == null || types.size() == 0) {
      return false;
    }
    if (types.stream().anyMatch(s -> s.getType() != Schema.Type.RECORD)) {
      return false;
    }
    int numFields = types.get(0).getFields().size();
    return types.stream().allMatch(s -> s.getFields().size() == numFields);
  }
  /**
   * Converts Flink SQL {@link LogicalType} (can be nested) into an Avro schema.
   *
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/AvroToRowDataConverters.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/AvroToRowDataConverters.java
@@ -106,7 +106,7 @@ public class AvroToRowDataConverters {
  /**
   * Creates a runtime converter which assuming input object is not null.
   */
-  private static AvroToRowDataConverter createConverter(LogicalType type) {
+  public static AvroToRowDataConverter createConverter(LogicalType type) {
    switch (type.getTypeRoot()) {
      case NULL:
        return avroObject -> null;
@@ -121,6 +121,7 @@ public class AvroToRowDataConverters {
      case INTERVAL_DAY_TIME: // long
      case FLOAT: // float
      case DOUBLE: // double
      case RAW:
        return avroObject -> avroObject;
      case DATE:
        return AvroToRowDataConverters::convertToDate;
@@ -143,7 +144,6 @@ public class AvroToRowDataConverters {
      case MAP:
      case MULTISET:
        return createMapConverter(type);
      case RAW:
      default:
        throw new UnsupportedOperationException("Unsupported type: " + type);
    }
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/DataTypeUtils.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/DataTypeUtils.java
@@ -23,8 +23,11 @@ import org.apache.hudi.common.util.ValidationUtils;
 import org.apache.flink.table.types.DataType;
 import org.apache.flink.table.types.logical.LogicalType;
 import org.apache.flink.table.types.logical.LogicalTypeRoot;
 import org.apache.flink.table.types.logical.RowType;
 import org.apache.flink.table.types.logical.TimestampType;
 import java.util.Arrays;
 /**
 * Utilities for {@link org.apache.flink.table.types.DataType}.
 */
@@ -58,4 +61,12 @@ public class DataTypeUtils {
  public static boolean isDatetimeType(DataType type) {
    return isTimestampType(type) || isDateType(type);
  }
  /**
   * Projects the row fields with given names.
   */
  public static RowType.RowField[] projectRowFields(RowType rowType, String[] names) {
    int [] fieldIndices = Arrays.stream(names).mapToInt(rowType::getFieldIndex).toArray();
    return Arrays.stream(fieldIndices).mapToObj(i -> rowType.getFields().get(i)).toArray(RowType.RowField[]::new);
  }
 }
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/ExpressionUtils.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/ExpressionUtils.java
@@ -0,0 +1,180 @@
 /*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 package org.apache.hudi.util;
 import org.apache.flink.table.expressions.CallExpression;
 import org.apache.flink.table.expressions.Expression;
 import org.apache.flink.table.expressions.FieldReferenceExpression;
 import org.apache.flink.table.expressions.ResolvedExpression;
 import org.apache.flink.table.expressions.ValueLiteralExpression;
 import org.apache.flink.table.functions.BuiltInFunctionDefinitions;
 import org.apache.flink.table.functions.FunctionDefinition;
 import org.apache.flink.table.types.logical.LogicalType;
 import javax.annotation.Nullable;
 import java.math.BigDecimal;
 import java.time.LocalDate;
 import java.time.LocalDateTime;
 import java.time.LocalTime;
 import java.time.ZoneOffset;
 import java.time.temporal.ChronoField;
 import java.util.Arrays;
 import java.util.List;
 /**
 * Utilities for expression resolving.
 */
 public class ExpressionUtils {

   /**
    * Collect the referenced columns with given expressions,
    * only simple call expression is supported.
    *
    * <p>Every expression (and every operand of a NOT/AND/OR call) is cast to
    * {@link CallExpression}, so callers are expected to keep only the expressions accepted by
    * {@link #isSimpleCallExpression(Expression)}; anything else fails with a
    * {@link ClassCastException}.
    *
    * @param exprs the expressions to inspect
    * @return the referenced column names in encounter order, without duplicates
    */
   public static String[] referencedColumns(List<ResolvedExpression> exprs) {
     return exprs.stream()
         .map(ExpressionUtils::getReferencedColumns)
         .flatMap(Arrays::stream)
         .distinct() // deduplication
         .toArray(String[]::new);
   }

   /**
    * Returns whether the given expression is simple call expression:
    * a binary call with one operand as field reference and another operand
    * as literal.
    *
    * <p>The accepted functions are NOT, AND, OR, IN, EQUALS, NOT_EQUALS, IS_NULL, IS_NOT_NULL,
    * LESS_THAN, GREATER_THAN, LESS_THAN_OR_EQUAL and GREATER_THAN_OR_EQUAL:
    * <ul>
    *   <li>NOT/AND/OR are simple when all their operands are simple call expressions;</li>
    *   <li>IN is always accepted, its operands are not inspected;</li>
    *   <li>IS_NULL/IS_NOT_NULL are simple when all their operands are field references;</li>
    *   <li>the remaining comparisons need exactly one field reference and one literal.</li>
    * </ul>
    *
    * @param expr the expression to check
    * @return true if the expression is a simple call expression
    */
   public static boolean isSimpleCallExpression(Expression expr) {
     if (!(expr instanceof CallExpression)) {
       return false;
     }
     CallExpression callExpression = (CallExpression) expr;
     FunctionDefinition funcDef = callExpression.getFunctionDefinition();
     // logical connectives: simple only if every operand is simple
     if (funcDef == BuiltInFunctionDefinitions.NOT
         || funcDef == BuiltInFunctionDefinitions.AND
         || funcDef == BuiltInFunctionDefinitions.OR) {
       return callExpression.getChildren().stream()
           .allMatch(ExpressionUtils::isSimpleCallExpression);
     }
     // handle IN
     if (funcDef == BuiltInFunctionDefinitions.IN) {
       // In expression RHS operands are always literals
       return true;
     }
     // handle unary operator
     if (funcDef == BuiltInFunctionDefinitions.IS_NULL
         || funcDef == BuiltInFunctionDefinitions.IS_NOT_NULL) {
       return callExpression.getChildren().stream()
           .allMatch(e -> e instanceof FieldReferenceExpression);
     }
     // handle binary operator
     if (funcDef == BuiltInFunctionDefinitions.EQUALS
         || funcDef == BuiltInFunctionDefinitions.NOT_EQUALS
         || funcDef == BuiltInFunctionDefinitions.LESS_THAN
         || funcDef == BuiltInFunctionDefinitions.GREATER_THAN
         || funcDef == BuiltInFunctionDefinitions.LESS_THAN_OR_EQUAL
         || funcDef == BuiltInFunctionDefinitions.GREATER_THAN_OR_EQUAL) {
       return isFieldReferenceAndLiteral(callExpression.getChildren());
     }
     // any other function is not supported
     return false;
   }

   /**
    * Returns whether the given operands are exactly one field reference and one value literal,
    * in either order.
    */
   private static boolean isFieldReferenceAndLiteral(List<Expression> exprs) {
     if (exprs.size() != 2) {
       return false;
     }
     final Expression expr0 = exprs.get(0);
     final Expression expr1 = exprs.get(1);
     return expr0 instanceof FieldReferenceExpression && expr1 instanceof ValueLiteralExpression
         || expr0 instanceof ValueLiteralExpression && expr1 instanceof FieldReferenceExpression;
   }

   /**
    * Returns the names of the field references of the given call expression; for NOT/AND/OR
    * the operands are visited recursively.
    *
    * <p>The expression must be a {@link CallExpression}, the cast fails otherwise.
    */
   private static String[] getReferencedColumns(ResolvedExpression expression) {
     CallExpression callExpr = (CallExpression) expression;
     FunctionDefinition funcDef = callExpr.getFunctionDefinition();
     if (funcDef == BuiltInFunctionDefinitions.NOT
         || funcDef == BuiltInFunctionDefinitions.AND
         || funcDef == BuiltInFunctionDefinitions.OR) {
       return callExpr.getChildren().stream()
           .map(e -> getReferencedColumns((ResolvedExpression) e))
           .flatMap(Arrays::stream)
           .toArray(String[]::new);
     }
     // leaf call: only the direct field reference operands contribute
     return callExpr.getChildren().stream()
         .filter(expr -> expr instanceof FieldReferenceExpression)
         .map(expr -> ((FieldReferenceExpression) expr).getName())
         .toArray(String[]::new);
   }

   /**
    * Returns the value with given value literal expression.
    *
    * <p>Returns null if the value can not parse as the output data type correctly,
    * should call {@code ValueLiteralExpression.isNull} first to decide whether
    * the literal is NULL.
    *
    * <p>Temporal literals are returned in their numeric form: timestamps as epoch milliseconds
    * (interpreted at UTC), times as milliseconds of the day and dates as days since epoch.
    *
    * @param expr the literal to extract the value from
    * @return the literal value, or null if it is absent or can not be converted
    * @throws UnsupportedOperationException if the literal has an unsupported logical type
    */
   @Nullable
   public static Object getValueFromLiteral(ValueLiteralExpression expr) {
     LogicalType logicalType = expr.getOutputDataType().getLogicalType();
     switch (logicalType.getTypeRoot()) {
       case TIMESTAMP_WITHOUT_TIME_ZONE:
         return expr.getValueAs(LocalDateTime.class)
             .map(ldt -> ldt.toInstant(ZoneOffset.UTC).toEpochMilli())
             .orElse(null);
       case TIME_WITHOUT_TIME_ZONE:
         return expr.getValueAs(LocalTime.class)
             .map(lt -> lt.get(ChronoField.MILLI_OF_DAY))
             .orElse(null);
       case DATE:
         return expr.getValueAs(LocalDate.class)
             .map(LocalDate::toEpochDay)
             .orElse(null);
       case BOOLEAN:
         return expr.getValueAs(Boolean.class).orElse(null);
       // NOTE: All integral types of size less than Int are encoded as Ints in MT
       case TINYINT:
       case SMALLINT:
       case INTEGER:
         return expr.getValueAs(Integer.class).orElse(null);
       case BIGINT:
         // long literals used to fall through to the unsupported branch
         return expr.getValueAs(Long.class).orElse(null);
       case FLOAT:
         return expr.getValueAs(Float.class).orElse(null);
       case DOUBLE:
         return expr.getValueAs(Double.class).orElse(null);
       case BINARY:
       case VARBINARY:
         return expr.getValueAs(byte[].class).orElse(null);
       case CHAR:
       case VARCHAR:
         return expr.getValueAs(String.class).orElse(null);
       case DECIMAL:
         return expr.getValueAs(BigDecimal.class).orElse(null);
       default:
         throw new UnsupportedOperationException("Unsupported type: " + logicalType);
     }
   }
 }
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/RowDataProjection.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/RowDataProjection.java
@@ -26,6 +26,8 @@ import org.apache.flink.table.types.logical.LogicalType;
 import org.apache.flink.table.types.logical.RowType;
 import java.io.Serializable;
 import java.util.Arrays;
 import java.util.List;
 /**
 * Utilities to project the row data with given positions.
@@ -51,6 +53,12 @@ public class RowDataProjection implements Serializable {
    return new RowDataProjection(types, positions);
  }
  public static RowDataProjection instanceV2(RowType rowType, int[] positions) {
    List<LogicalType> fieldTypes = rowType.getChildren();
    final LogicalType[] types = Arrays.stream(positions).mapToObj(fieldTypes::get).toArray(LogicalType[]::new);
    return new RowDataProjection(types, positions);
  }
  public static RowDataProjection instance(LogicalType[] types, int[] positions) {
    return new RowDataProjection(types, positions);
  }
--- a/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/ViewStorageProperties.java
+++ b/hudi-flink-datasource/hudi-flink/src/main/java/org/apache/hudi/util/ViewStorageProperties.java
@@ -18,12 +18,12 @@
 package org.apache.hudi.util;
 import org.apache.flink.configuration.Configuration;
 import org.apache.hudi.common.fs.FSUtils;
 import org.apache.hudi.common.table.view.FileSystemViewStorageConfig;
 import org.apache.hudi.configuration.HadoopConfigurations;
 import org.apache.hudi.exception.HoodieIOException;
 import org.apache.flink.configuration.Configuration;
 import org.apache.hadoop.fs.FSDataInputStream;
 import org.apache.hadoop.fs.FSDataOutputStream;
 import org.apache.hadoop.fs.FileSystem;
--- a/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/sink/utils/TestHiveSyncContext.java
+++ b/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/sink/utils/TestHiveSyncContext.java
@@ -18,11 +18,10 @@
 package org.apache.hudi.sink.utils;
 import org.apache.flink.configuration.Configuration;
 import org.apache.hudi.configuration.FlinkOptions;
 import org.apache.hudi.hive.HiveSyncConfig;
 import org.apache.flink.configuration.Configuration;
 import org.junit.jupiter.api.Test;
 import java.lang.reflect.Method;
--- a/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/source/TestFileIndex.java
+++ b/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/source/TestFileIndex.java
@@ -58,7 +58,7 @@ public class TestFileIndex {
    conf.setBoolean(FlinkOptions.METADATA_ENABLED, true);
    conf.setBoolean(FlinkOptions.HIVE_STYLE_PARTITIONING, hiveStylePartitioning);
    TestData.writeData(TestData.DATA_SET_INSERT, conf);
-    FileIndex fileIndex = FileIndex.instance(new Path(tempFile.getAbsolutePath()), conf);
+    FileIndex fileIndex = FileIndex.instance(new Path(tempFile.getAbsolutePath()), conf, TestConfigurations.ROW_TYPE);
    List<String> partitionKeys = Collections.singletonList("partition");
    List<Map<String, String>> partitions = fileIndex.getPartitions(partitionKeys, "default", hiveStylePartitioning);
    assertTrue(partitions.stream().allMatch(m -> m.size() == 1));
@@ -79,7 +79,7 @@ public class TestFileIndex {
    conf.setString(FlinkOptions.KEYGEN_CLASS_NAME, NonpartitionedAvroKeyGenerator.class.getName());
    conf.setBoolean(FlinkOptions.METADATA_ENABLED, true);
    TestData.writeData(TestData.DATA_SET_INSERT, conf);
-    FileIndex fileIndex = FileIndex.instance(new Path(tempFile.getAbsolutePath()), conf);
+    FileIndex fileIndex = FileIndex.instance(new Path(tempFile.getAbsolutePath()), conf, TestConfigurations.ROW_TYPE);
    List<String> partitionKeys = Collections.singletonList("");
    List<Map<String, String>> partitions = fileIndex.getPartitions(partitionKeys, "default", false);
    assertThat(partitions.size(), is(0));
@@ -94,7 +94,7 @@ public class TestFileIndex {
  void testFileListingEmptyTable(boolean enableMetadata) {
    Configuration conf = TestConfigurations.getDefaultConf(tempFile.getAbsolutePath());
    conf.setBoolean(FlinkOptions.METADATA_ENABLED, enableMetadata);
-    FileIndex fileIndex = FileIndex.instance(new Path(tempFile.getAbsolutePath()), conf);
+    FileIndex fileIndex = FileIndex.instance(new Path(tempFile.getAbsolutePath()), conf, TestConfigurations.ROW_TYPE);
    List<String> partitionKeys = Collections.singletonList("partition");
    List<Map<String, String>> partitions = fileIndex.getPartitions(partitionKeys, "default", false);
    assertThat(partitions.size(), is(0));
--- a/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/source/stats/TestColumnStatsIndices.java
+++ b/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/source/stats/TestColumnStatsIndices.java
@@ -0,0 +1,98 @@
 /*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 package org.apache.hudi.source.stats;
 import org.apache.hudi.common.config.HoodieMetadataConfig;
 import org.apache.hudi.common.util.collection.Pair;
 import org.apache.hudi.configuration.FlinkOptions;
 import org.apache.hudi.utils.TestConfigurations;
 import org.apache.hudi.utils.TestData;
 import org.apache.flink.configuration.Configuration;
 import org.apache.flink.table.data.GenericRowData;
 import org.apache.flink.table.data.RowData;
 import org.junit.jupiter.api.Test;
 import org.junit.jupiter.api.io.TempDir;
 import java.io.File;
 import java.util.Arrays;
 import java.util.Comparator;
 import java.util.List;
 import java.util.stream.Collectors;
 import static org.hamcrest.CoreMatchers.is;
 import static org.hamcrest.MatcherAssert.assertThat;
 import static org.junit.jupiter.api.Assertions.assertThrows;
 /**
 * Test cases for {@link ColumnStatsIndices}.
 */
 public class TestColumnStatsIndices {

   @TempDir
   File tempFile;

   /**
    * Writes the insert data set, reads the column stats index for two explicit columns and
    * verifies the transposed result; also verifies that an empty column list is rejected.
    */
   @Test
   void testTransposeColumnStatsIndex() throws Exception {
     final String basePath = tempFile.getAbsolutePath();
     Configuration conf = TestConfigurations.getDefaultConf(basePath);
     conf.setBoolean(FlinkOptions.METADATA_ENABLED, true);
     conf.setBoolean(FlinkOptions.READ_DATA_SKIPPING_ENABLED, true);
     conf.setString("hoodie.metadata.index.column.stats.enable", "true");

     HoodieMetadataConfig metadataConfig = HoodieMetadataConfig.newBuilder()
         .enable(true)
         .withMetadataIndexColumnStats(true)
         .build();
     TestData.writeData(TestData.DATA_SET_INSERT, conf);

     // explicit query columns
     String[] queryColumns = {"uuid", "age"};
     List<RowData> indexRows = ColumnStatsIndices.readColumnStatsIndex(basePath, metadataConfig, queryColumns);
     Pair<List<RowData>, String[]> transposedIndexTable = ColumnStatsIndices
         .transposeColumnStatsIndex(indexRows, queryColumns, TestConfigurations.ROW_TYPE);
     String actualColumns = Arrays.toString(transposedIndexTable.getRight());
     assertThat("The schema columns should sort by natural order", actualColumns, is("[age, uuid]"));

     List<RowData> transposedRows = filterOutFileNames(transposedIndexTable.getLeft());
     assertThat(transposedRows.size(), is(4));
     final String expected = "["
         + "+I(2,18,20,0,id5,id6,0), "
         + "+I(2,23,33,0,id1,id2,0), "
         + "+I(2,31,53,0,id3,id4,0), "
         + "+I(2,44,56,0,id7,id8,0)]";
     assertThat(transposedRows.toString(), is(expected));

     // no query columns, only for tests
     assertThrows(IllegalArgumentException.class,
         () -> ColumnStatsIndices.readColumnStatsIndex(basePath, metadataConfig, new String[0]));
   }

   /**
    * Drops the first field of every row and sorts the remaining rows by the int at position 1.
    */
   private static List<RowData> filterOutFileNames(List<RowData> indexRows) {
     // sort by age min values
     Comparator<RowData> byAgeMin = Comparator.comparingInt(r -> r.getInt(1));
     return indexRows.stream()
         .map(TestColumnStatsIndices::dropLeadingField)
         .sorted(byAgeMin)
         .collect(Collectors.toList());
   }

   /**
    * Copies all the fields but the first one into a new row.
    */
   private static RowData dropLeadingField(RowData row) {
     GenericRowData source = (GenericRowData) row;
     GenericRowData target = new GenericRowData(source.getArity() - 1);
     for (int pos = 1; pos < source.getArity(); pos++) {
       target.setField(pos - 1, source.getField(pos));
     }
     return target;
   }
 }
--- a/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/source/stats/TestExpressionEvaluator.java
+++ b/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/source/stats/TestExpressionEvaluator.java
@@ -0,0 +1,374 @@
 /*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 package org.apache.hudi.source.stats;
 import org.apache.hudi.utils.TestData;
 import org.apache.flink.table.api.DataTypes;
 import org.apache.flink.table.data.RowData;
 import org.apache.flink.table.data.StringData;
 import org.apache.flink.table.data.TimestampData;
 import org.apache.flink.table.expressions.FieldReferenceExpression;
 import org.apache.flink.table.expressions.ValueLiteralExpression;
 import org.apache.flink.table.types.DataType;
 import org.apache.flink.table.types.logical.RowType;
 import org.junit.jupiter.api.Test;
 import java.util.Arrays;
 import java.util.List;
 import static org.junit.jupiter.api.Assertions.assertFalse;
 import static org.junit.jupiter.api.Assertions.assertTrue;
 /**
 * Test cases for {@link ExpressionEvaluator}.
 */
 public class TestExpressionEvaluator {
   // Non-null row type with one field per tested data type; "f_int" sits at position 2.
   private static final DataType ROW_DATA_TYPE = DataTypes.ROW(
       DataTypes.FIELD("f_tinyint", DataTypes.TINYINT()),
       DataTypes.FIELD("f_smallint", DataTypes.SMALLINT()),
       DataTypes.FIELD("f_int", DataTypes.INT()),
       DataTypes.FIELD("f_long", DataTypes.BIGINT()),
       DataTypes.FIELD("f_float", DataTypes.FLOAT()),
       DataTypes.FIELD("f_double", DataTypes.DOUBLE()),
       DataTypes.FIELD("f_boolean", DataTypes.BOOLEAN()),
       DataTypes.FIELD("f_decimal", DataTypes.DECIMAL(10, 2)),
       DataTypes.FIELD("f_bytes", DataTypes.VARBINARY(10)),
       DataTypes.FIELD("f_string", DataTypes.VARCHAR(10)),
       DataTypes.FIELD("f_time", DataTypes.TIME(3)),
       DataTypes.FIELD("f_date", DataTypes.DATE()),
       DataTypes.FIELD("f_timestamp", DataTypes.TIMESTAMP(3))
       ).notNull();
   // Non-null row type of an index row: the file name and the value count, followed by a
   // (min, max, null count) triple for each of the columns f_int, f_string and f_timestamp.
   private static final DataType INDEX_ROW_DATA_TYPE = DataTypes.ROW(
       DataTypes.FIELD("file_name", DataTypes.STRING()),
       DataTypes.FIELD("value_cnt", DataTypes.BIGINT()),
       DataTypes.FIELD("f_int_min", DataTypes.INT()),
       DataTypes.FIELD("f_int_max", DataTypes.INT()),
       DataTypes.FIELD("f_int_null_cnt", DataTypes.BIGINT()),
       DataTypes.FIELD("f_string_min", DataTypes.VARCHAR(10)),
       DataTypes.FIELD("f_string_max", DataTypes.VARCHAR(10)),
       DataTypes.FIELD("f_string_null_cnt", DataTypes.BIGINT()),
       DataTypes.FIELD("f_timestamp_min", DataTypes.TIMESTAMP(3)),
       DataTypes.FIELD("f_timestamp_max", DataTypes.TIMESTAMP(3)),
       DataTypes.FIELD("f_timestamp_null_cnt", DataTypes.BIGINT())
   ).notNull();
   // Logical row type view of INDEX_ROW_DATA_TYPE.
   private static final RowType INDEX_ROW_TYPE = (RowType) INDEX_ROW_DATA_TYPE.getLogicalType();
  @Test
  void testEqualTo() {
    ExpressionEvaluator.EqualTo equalTo = ExpressionEvaluator.EqualTo.getInstance();
    FieldReferenceExpression rExpr = new FieldReferenceExpression("f_int", DataTypes.INT(), 2, 2);
    ValueLiteralExpression vExpr = new ValueLiteralExpression(12);
    RowData indexRow1 = intIndexRow(11, 13);
    equalTo.bindFieldReference(rExpr)
        .bindVal(vExpr)
        .bindColStats(indexRow1, queryFields(2), rExpr);
    assertTrue(equalTo.eval(), "11 < 12 < 13");
    RowData indexRow2 = intIndexRow(12, 13);
    equalTo.bindColStats(indexRow2, queryFields(2), rExpr);
    assertTrue(equalTo.eval(), "12 <= 12 < 13");
    RowData indexRow3 = intIndexRow(11, 12);
    equalTo.bindColStats(indexRow3, queryFields(2), rExpr);
    assertTrue(equalTo.eval(), "11 < 12 <= 12");
    RowData indexRow4 = intIndexRow(10, 11);
    equalTo.bindColStats(indexRow4, queryFields(2), rExpr);
    assertFalse(equalTo.eval(), "11 < 12");
    RowData indexRow5 = intIndexRow(13, 14);
    equalTo.bindColStats(indexRow5, queryFields(2), rExpr);
    assertFalse(equalTo.eval(), "12 < 13");
    RowData indexRow6 = intIndexRow(null, null);
    equalTo.bindColStats(indexRow6, queryFields(2), rExpr);
    assertFalse(equalTo.eval(), "12 <> null");
    equalTo.bindVal(new ValueLiteralExpression(null, DataTypes.INT()));
    assertFalse(equalTo.eval(), "null <> null");
  }
  @Test
  void testNotEqualTo() {
    ExpressionEvaluator.NotEqualTo notEqualTo = ExpressionEvaluator.NotEqualTo.getInstance();
    FieldReferenceExpression rExpr = new FieldReferenceExpression("f_int", DataTypes.INT(), 2, 2);
    ValueLiteralExpression vExpr = new ValueLiteralExpression(12);
    RowData indexRow1 = intIndexRow(11, 13);
    notEqualTo.bindFieldReference(rExpr)
        .bindVal(vExpr)
        .bindColStats(indexRow1, queryFields(2), rExpr);
    assertTrue(notEqualTo.eval(), "11 <> 12 && 12 <> 13");
    RowData indexRow2 = intIndexRow(12, 13);
    notEqualTo.bindColStats(indexRow2, queryFields(2), rExpr);
    assertTrue(notEqualTo.eval(), "12 <> 13");
    RowData indexRow3 = intIndexRow(11, 12);
    notEqualTo.bindColStats(indexRow3, queryFields(2), rExpr);
    assertTrue(notEqualTo.eval(), "11 <> 12");
    RowData indexRow4 = intIndexRow(10, 11);
    notEqualTo.bindColStats(indexRow4, queryFields(2), rExpr);
    assertTrue(notEqualTo.eval(), "10 <> 12 and 11 < 12");
    RowData indexRow5 = intIndexRow(13, 14);
    notEqualTo.bindColStats(indexRow5, queryFields(2), rExpr);
    assertTrue(notEqualTo.eval(), "12 <> 13 and 12 <> 14");
    RowData indexRow6 = intIndexRow(null, null);
    notEqualTo.bindColStats(indexRow6, queryFields(2), rExpr);
    assertTrue(notEqualTo.eval(), "12 <> null");
    notEqualTo.bindVal(new ValueLiteralExpression(null, DataTypes.INT()));
    assertTrue(notEqualTo.eval(), "null <> null");
  }
  @Test
  void testIsNull() {
    ExpressionEvaluator.IsNull isNull = ExpressionEvaluator.IsNull.getInstance();
    FieldReferenceExpression rExpr = new FieldReferenceExpression("f_int", DataTypes.INT(), 2, 2);
    RowData indexRow1 = intIndexRow(11, 13);
    isNull.bindFieldReference(rExpr)
        .bindColStats(indexRow1, queryFields(2), rExpr);
    assertTrue(isNull.eval(), "2 nulls");
    RowData indexRow2 = intIndexRow(12, 13, 0L);
    isNull.bindColStats(indexRow2, queryFields(2), rExpr);
    assertFalse(isNull.eval(), "0 nulls");
  }
  @Test
  void testIsNotNull() {
    ExpressionEvaluator.IsNotNull isNotNull = ExpressionEvaluator.IsNotNull.getInstance();
    FieldReferenceExpression rExpr = new FieldReferenceExpression("f_int", DataTypes.INT(), 2, 2);
    RowData indexRow1 = intIndexRow(11, 13);
    isNotNull.bindFieldReference(rExpr)
        .bindColStats(indexRow1, queryFields(2), rExpr);
    assertTrue(isNotNull.eval(), "min 11 is not null");
    RowData indexRow2 = intIndexRow(null, null, 0L);
    isNotNull.bindColStats(indexRow2, queryFields(2), rExpr);
    assertTrue(isNotNull.eval(), "min is null and 0 nulls");
  }
  @Test
  void testLessThan() {
    ExpressionEvaluator.LessThan lessThan = ExpressionEvaluator.LessThan.getInstance();
    FieldReferenceExpression rExpr = new FieldReferenceExpression("f_int", DataTypes.INT(), 2, 2);
    ValueLiteralExpression vExpr = new ValueLiteralExpression(12);
    RowData indexRow1 = intIndexRow(11, 13);
    lessThan.bindFieldReference(rExpr)
        .bindVal(vExpr)
        .bindColStats(indexRow1, queryFields(2), rExpr);
    assertTrue(lessThan.eval(), "12 < 13");
    RowData indexRow2 = intIndexRow(12, 13);
    lessThan.bindColStats(indexRow2, queryFields(2), rExpr);
    assertFalse(lessThan.eval(), "min 12 = 12");
    RowData indexRow3 = intIndexRow(11, 12);
    lessThan.bindColStats(indexRow3, queryFields(2), rExpr);
    assertTrue(lessThan.eval(), "11 < 12");
    RowData indexRow4 = intIndexRow(10, 11);
    lessThan.bindColStats(indexRow4, queryFields(2), rExpr);
    assertTrue(lessThan.eval(), "11 < 12");
    RowData indexRow5 = intIndexRow(13, 14);
    lessThan.bindColStats(indexRow5, queryFields(2), rExpr);
    assertFalse(lessThan.eval(), "12 < min 13");
    RowData indexRow6 = intIndexRow(null, null);
    lessThan.bindColStats(indexRow6, queryFields(2), rExpr);
    assertFalse(lessThan.eval(), "12 <> null");
    lessThan.bindVal(new ValueLiteralExpression(null, DataTypes.INT()));
    assertFalse(lessThan.eval(), "null <> null");
  }
  @Test
  void testGreaterThan() {
    ExpressionEvaluator.GreaterThan greaterThan = ExpressionEvaluator.GreaterThan.getInstance();
    FieldReferenceExpression rExpr = new FieldReferenceExpression("f_int", DataTypes.INT(), 2, 2);
    ValueLiteralExpression vExpr = new ValueLiteralExpression(12);
    RowData indexRow1 = intIndexRow(11, 13);
    greaterThan.bindFieldReference(rExpr)
        .bindVal(vExpr)
        .bindColStats(indexRow1, queryFields(2), rExpr);
    assertTrue(greaterThan.eval(), "12 < 13");
    RowData indexRow2 = intIndexRow(12, 13);
    greaterThan.bindColStats(indexRow2, queryFields(2), rExpr);
    assertTrue(greaterThan.eval(), "12 < 13");
    RowData indexRow3 = intIndexRow(11, 12);
    greaterThan.bindColStats(indexRow3, queryFields(2), rExpr);
    assertFalse(greaterThan.eval(), "max 12 = 12");
    RowData indexRow4 = intIndexRow(10, 11);
    greaterThan.bindColStats(indexRow4, queryFields(2), rExpr);
    assertFalse(greaterThan.eval(), "max 11 < 12");
    RowData indexRow5 = intIndexRow(13, 14);
    greaterThan.bindColStats(indexRow5, queryFields(2), rExpr);
    assertTrue(greaterThan.eval(), "12 < 13");
    RowData indexRow6 = intIndexRow(null, null);
    greaterThan.bindColStats(indexRow6, queryFields(2), rExpr);
    assertFalse(greaterThan.eval(), "12 <> null");
    greaterThan.bindVal(new ValueLiteralExpression(null, DataTypes.INT()));
    assertFalse(greaterThan.eval(), "null <> null");
  }
  /**
   * Exercises the {@code LessThanOrEqual} evaluator with the literal 12 against a series of
   * min/max column stats rows, then against all-null stats and a null literal.
   */
  @Test
  void testLessThanOrEqual() {
    final ExpressionEvaluator.LessThanOrEqual evaluator = ExpressionEvaluator.LessThanOrEqual.getInstance();
    final FieldReferenceExpression fieldRef = new FieldReferenceExpression("f_int", DataTypes.INT(), 2, 2);
    final ValueLiteralExpression literal = new ValueLiteralExpression(12);
    // min = 11, max = 13
    evaluator.bindFieldReference(fieldRef)
        .bindVal(literal)
        .bindColStats(intIndexRow(11, 13), queryFields(2), fieldRef);
    assertTrue(evaluator.eval(), "11 < 12");
    // min = 12, max = 13
    evaluator.bindColStats(intIndexRow(12, 13), queryFields(2), fieldRef);
    assertTrue(evaluator.eval(), "min 12 = 12");
    // min = 11, max = 12
    evaluator.bindColStats(intIndexRow(11, 12), queryFields(2), fieldRef);
    assertTrue(evaluator.eval(), "max 12 = 12");
    // min = 10, max = 11
    evaluator.bindColStats(intIndexRow(10, 11), queryFields(2), fieldRef);
    assertTrue(evaluator.eval(), "max 11 < 12");
    // min = 13, max = 14
    evaluator.bindColStats(intIndexRow(13, 14), queryFields(2), fieldRef);
    assertFalse(evaluator.eval(), "12 < 13");
    // both stats are null
    evaluator.bindColStats(intIndexRow(null, null), queryFields(2), fieldRef);
    assertFalse(evaluator.eval(), "12 <> null");
    // null literal on top of the null stats bound above
    evaluator.bindVal(new ValueLiteralExpression(null, DataTypes.INT()));
    assertFalse(evaluator.eval(), "null <> null");
  }
  /**
   * Exercises the {@code GreaterThanOrEqual} evaluator with the literal 12 against a series of
   * min/max column stats rows, then against all-null stats and a null literal.
   */
  @Test
  void testGreaterThanOrEqual() {
    final ExpressionEvaluator.GreaterThanOrEqual evaluator = ExpressionEvaluator.GreaterThanOrEqual.getInstance();
    final FieldReferenceExpression fieldRef = new FieldReferenceExpression("f_int", DataTypes.INT(), 2, 2);
    final ValueLiteralExpression literal = new ValueLiteralExpression(12);
    // min = 11, max = 13
    evaluator.bindFieldReference(fieldRef)
        .bindVal(literal)
        .bindColStats(intIndexRow(11, 13), queryFields(2), fieldRef);
    assertTrue(evaluator.eval(), "12 < 13");
    // min = 12, max = 13
    evaluator.bindColStats(intIndexRow(12, 13), queryFields(2), fieldRef);
    assertTrue(evaluator.eval(), "min 12 = 12");
    // min = 11, max = 12
    evaluator.bindColStats(intIndexRow(11, 12), queryFields(2), fieldRef);
    assertTrue(evaluator.eval(), "max 12 = 12");
    // min = 10, max = 11
    evaluator.bindColStats(intIndexRow(10, 11), queryFields(2), fieldRef);
    assertFalse(evaluator.eval(), "max 11 < 12");
    // min = 13, max = 14
    evaluator.bindColStats(intIndexRow(13, 14), queryFields(2), fieldRef);
    assertTrue(evaluator.eval(), "12 < 13");
    // both stats are null
    evaluator.bindColStats(intIndexRow(null, null), queryFields(2), fieldRef);
    assertFalse(evaluator.eval(), "12 <> null");
    // null literal on top of the null stats bound above
    evaluator.bindVal(new ValueLiteralExpression(null, DataTypes.INT()));
    assertFalse(evaluator.eval(), "null <> null");
  }
  /**
   * Exercises the {@code In} evaluator with the single candidate value 12 against a series of
   * min/max column stats rows, then against all-null stats and a null candidate value.
   */
  @Test
  void testIn() {
    final ExpressionEvaluator.In evaluator = ExpressionEvaluator.In.getInstance();
    final FieldReferenceExpression fieldRef = new FieldReferenceExpression("f_int", DataTypes.INT(), 2, 2);
    // min = 11, max = 13; the candidate values are bound after the stats
    evaluator.bindFieldReference(fieldRef)
        .bindColStats(intIndexRow(11, 13), queryFields(2), fieldRef);
    evaluator.bindVals(12);
    assertTrue(evaluator.eval(), "11 < 12 < 13");
    // min = 12, max = 13
    evaluator.bindColStats(intIndexRow(12, 13), queryFields(2), fieldRef);
    assertTrue(evaluator.eval(), "min 12 = 12");
    // min = 11, max = 12
    evaluator.bindColStats(intIndexRow(11, 12), queryFields(2), fieldRef);
    assertTrue(evaluator.eval(), "max 12 = 12");
    // min = 10, max = 11
    evaluator.bindColStats(intIndexRow(10, 11), queryFields(2), fieldRef);
    assertFalse(evaluator.eval(), "max 11 < 12");
    // min = 13, max = 14
    evaluator.bindColStats(intIndexRow(13, 14), queryFields(2), fieldRef);
    assertFalse(evaluator.eval(), "12 < 13");
    // both stats are null
    evaluator.bindColStats(intIndexRow(null, null), queryFields(2), fieldRef);
    assertFalse(evaluator.eval(), "12 <> null");
    // a single null candidate; the cast keeps it from being taken as a null varargs array
    evaluator.bindVals((Object) null);
    assertFalse(evaluator.eval(), "null <> null");
  }
  /**
   * Shorthand for {@code intIndexRow(minVal, maxVal, 2L)}: builds an index row with the
   * given int min/max values and a null count of 2.
   *
   * @param minVal min value to put into the row, may be null
   * @param maxVal max value to put into the row, may be null
   * @return the index row
   */
  private static RowData intIndexRow(Integer minVal, Integer maxVal) {
    final Long defaultNullCnt = 2L;
    return intIndexRow(minVal, maxVal, defaultNullCnt);
  }
  /**
   * Builds an index row whose int min/max/null-count slots carry the given values while
   * every other slot is filled with fixed sample values.
   *
   * <p>NOTE(review): the meaning of each slot is dictated by {@code INDEX_ROW_TYPE}, which
   * is declared elsewhere; presumably the leading two values are the file name and the
   * value count, followed by min/max/null-count triples for an int, a string and a
   * timestamp column. Confirm against that declaration.
   *
   * @param minVal  min value of the int triple, may be null
   * @param maxVal  max value of the int triple, may be null
   * @param nullCnt null count of the int triple
   * @return the index row
   */
  private static RowData intIndexRow(Integer minVal, Integer maxVal, Long nullCnt) {
    final Object[] rowFields = {
        StringData.fromString("f1"), 100L,
        minVal, maxVal, nullCnt,
        StringData.fromString("1"), StringData.fromString("100"), 5L,
        TimestampData.fromEpochMillis(1), TimestampData.fromEpochMillis(100), 3L
    };
    // The array is handed over as the varargs array itself.
    return indexRow(rowFields);
  }
  /**
   * Builds a row of type {@code INDEX_ROW_TYPE} from the given field values by delegating
   * to {@code TestData.insertRow}.
   *
   * @param fields the field values, in row order
   * @return the row produced by {@code TestData.insertRow}
   */
  private static RowData indexRow(Object... fields) {
    final RowData row = TestData.insertRow(INDEX_ROW_TYPE, fields);
    return row;
  }
  /**
   * Picks the fields of {@code ROW_DATA_TYPE} at the given positions.
   *
   * @param pos positions of the wanted fields within the row type
   * @return the selected fields, in the order of {@code pos}
   */
  private static RowType.RowField[] queryFields(int... pos) {
    final RowType rowType = (RowType) ROW_DATA_TYPE.getLogicalType();
    final List<RowType.RowField> allFields = rowType.getFields();
    final RowType.RowField[] selected = new RowType.RowField[pos.length];
    for (int i = 0; i < pos.length; i++) {
      selected[i] = allFields.get(pos[i]);
    }
    return selected;
  }
 }
--- a/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/table/ITTestHoodieDataSource.java
+++ b/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/table/ITTestHoodieDataSource.java
@@ -1256,6 +1256,37 @@ public class ITTestHoodieDataSource extends AbstractTestBase {
    assertRowsEquals(partitionResult, "[+I[1, 2022-02-02]]");
  }
  /**
   * Creates table {@code t1} with {@code METADATA_ENABLED}, the column stats index option and
   * {@code READ_DATA_SKIPPING_ENABLED} all set to true, inserts the T1 data set, and checks
   * the rows returned by an unfiltered query and by two filtered queries.
   */
  @Test
  void testWriteAndReadWithDataSkipping() {
    final TableEnvironment env = batchTableEnv;
    final String ddl = sql("t1")
        .option(FlinkOptions.PATH, tempFile.getAbsolutePath())
        .option(FlinkOptions.METADATA_ENABLED, true)
        .option("hoodie.metadata.index.column.stats.enable", true)
        .option(FlinkOptions.READ_DATA_SKIPPING_ENABLED, true)
        .end();
    env.executeSql(ddl);
    execInsertSql(env, TestSQL.INSERT_T1);
    // no filter: every inserted row is expected back
    final String scanAll = "select * from t1";
    List<Row> allRows = CollectionUtil.iterableToList(
        () -> env.sqlQuery(scanAll).execute().collect());
    assertRowsEquals(allRows, TestData.DATA_SET_SOURCE_INSERT);
    // filters on a string column and an int column
    final String scanByUuidAndAge = "select * from t1 where uuid > 'id5' and age > 20";
    List<Row> uuidAndAgeRows = CollectionUtil.iterableToList(
        () -> env.sqlQuery(scanByUuidAndAge).execute().collect());
    assertRowsEquals(uuidAndAgeRows, "["
        + "+I[id7, Bob, 44, 1970-01-01T00:00:07, par4], "
        + "+I[id8, Han, 56, 1970-01-01T00:00:08, par4]]");
    // filter on the timestamp column
    final String scanByTs = "select * from t1 where ts > TIMESTAMP '1970-01-01 00:00:05'";
    List<Row> tsRows = CollectionUtil.iterableToList(
        () -> env.sqlQuery(scanByTs).execute().collect());
    assertRowsEquals(tsRows, "["
        + "+I[id6, Emma, 20, 1970-01-01T00:00:06, par3], "
        + "+I[id7, Bob, 44, 1970-01-01T00:00:07, par4], "
        + "+I[id8, Han, 56, 1970-01-01T00:00:08, par4]]");
  }
  // -------------------------------------------------------------------------
  //  Utilities
  // -------------------------------------------------------------------------
--- a/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/table/TestHoodieTableSource.java
+++ b/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/table/TestHoodieTableSource.java
@@ -28,6 +28,7 @@ import org.apache.flink.api.common.io.FileInputFormat;
 import org.apache.flink.api.common.io.InputFormat;
 import org.apache.flink.configuration.Configuration;
 import org.apache.flink.table.data.RowData;
 import org.apache.hadoop.fs.FileStatus;
 import org.apache.hadoop.fs.Path;
 import org.junit.jupiter.api.Test;
 import org.junit.jupiter.api.function.ThrowingSupplier;
@@ -38,7 +39,6 @@ import org.slf4j.LoggerFactory;
 import java.io.File;
 import java.util.Arrays;
 import java.util.Collections;
 import java.util.Comparator;
 import java.util.HashMap;
 import java.util.Map;
 import java.util.stream.Collectors;
@@ -76,22 +76,18 @@ public class TestHoodieTableSource {
        Arrays.asList(conf.getString(FlinkOptions.PARTITION_PATH_FIELD).split(",")),
        "default-par",
        conf);
-    Path[] paths = tableSource.getReadPaths();
+    FileStatus[] fileStatuses = tableSource.getReadFiles();
-    assertNotNull(paths);
+    assertNotNull(fileStatuses);
-    String[] names = Arrays.stream(paths).map(Path::getName)
+    assertThat(fileStatuses.length, is(4));
        .sorted(Comparator.naturalOrder()).toArray(String[]::new);
    assertThat(Arrays.toString(names), is("[par1, par2, par3, par4]"));
    // apply partition pruning
    Map<String, String> partitions = new HashMap<>();
    partitions.put("partition", "par1");
    tableSource.applyPartitions(Collections.singletonList(partitions));
-    Path[] paths2 = tableSource.getReadPaths();
+    FileStatus[] fileStatuses2 = tableSource.getReadFiles();
-    assertNotNull(paths2);
+    assertNotNull(fileStatuses2);
-    String[] names2 = Arrays.stream(paths2).map(Path::getName)
+    assertThat(fileStatuses2.length, is(1));
        .sorted(Comparator.naturalOrder()).toArray(String[]::new);
    assertThat(Arrays.toString(names2), is("[par1]"));
  }
  @Test
--- a/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/utils/TestAvroSchemaConverter.java
+++ b/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/utils/TestAvroSchemaConverter.java
@@ -0,0 +1,53 @@
 /*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 package org.apache.hudi.utils;
 import org.apache.hudi.avro.model.HoodieMetadataRecord;
 import org.apache.hudi.metadata.HoodieMetadataPayload;
 import org.apache.hudi.util.AvroSchemaConverter;
 import org.apache.avro.Schema;
 import org.apache.flink.table.types.DataType;
 import org.junit.jupiter.api.Test;
 import static org.hamcrest.CoreMatchers.is;
 import static org.hamcrest.MatcherAssert.assertThat;
 /**
 * Test cases for {@link org.apache.hudi.util.AvroSchemaConverter}.
 */
 public class TestAvroSchemaConverter {
  /**
   * Converts the {@link HoodieMetadataRecord} Avro schema to a Flink data type and checks
   * the string form of the child located at the position of the column stats field.
   */
  @Test
  void testUnionSchemaWithMultipleRecordTypes() {
    final Schema metadataSchema = HoodieMetadataRecord.SCHEMA$;
    final DataType converted = AvroSchemaConverter.convertToDataType(metadataSchema);
    // Position of the column stats field inside the metadata record schema.
    final int colStatsPos = metadataSchema.getField(HoodieMetadataPayload.SCHEMA_FIELD_ID_COLUMN_STATS).pos();
    final DataType colStatsType = converted.getChildren().get(colStatsPos);
    final String expected = "ROW<"
        + "`fileName` STRING, "
        + "`columnName` STRING, "
        + "`minValue` ROW<`wrapper` RAW('java.lang.Object', ?) NOT NULL>, "
        + "`maxValue` ROW<`wrapper` RAW('java.lang.Object', ?) NOT NULL>, "
        + "`valueCount` BIGINT, "
        + "`nullCount` BIGINT, "
        + "`totalSize` BIGINT, "
        + "`totalUncompressedSize` BIGINT, "
        + "`isDeleted` BOOLEAN NOT NULL>";
    assertThat(colStatsType.toString(), is(expected));
  }
 }
--- a/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/utils/TestConfigurations.java
+++ b/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/utils/TestConfigurations.java
@@ -318,6 +318,9 @@ public class TestConfigurations {
    }
  }
  /**
   * Tool to construct the catalog DDL.
   */
  public static class Catalog {
    private final String catalogName;
    private String catalogPath = ".";
--- a/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/utils/TestUtils.java
+++ b/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/utils/TestUtils.java
@@ -97,6 +97,6 @@ public class TestUtils {
  /**
   * Creates a {@link StreamReadMonitoringFunction} for the table base path that is read
   * from the {@code FlinkOptions.PATH} option of the given configuration.
   *
   * <p>NOTE(review): {@code 1024 * 1024L} is presumably a memory budget in bytes and the
   * trailing {@code null} an optional argument left unset; confirm against the
   * {@code StreamReadMonitoringFunction} constructor.
   *
   * @param conf the Flink configuration holding the table path
   * @return the monitoring function
   */
  public static StreamReadMonitoringFunction getMonitorFunc(Configuration conf) {
    final String basePath = conf.getString(FlinkOptions.PATH);
-    return new StreamReadMonitoringFunction(conf, new Path(basePath), 1024 * 1024L, null);
+    return new StreamReadMonitoringFunction(conf, new Path(basePath), TestConfigurations.ROW_TYPE, 1024 * 1024L, null);
  }
 }
--- a/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/utils/TestViewStorageProperties.java
+++ b/hudi-flink-datasource/hudi-flink/src/test/java/org/apache/hudi/utils/TestViewStorageProperties.java
@@ -18,11 +18,11 @@
 package org.apache.hudi.utils;
 import org.apache.flink.configuration.Configuration;
 import org.apache.hudi.common.table.view.FileSystemViewStorageConfig;
 import org.apache.hudi.common.table.view.FileSystemViewStorageType;
 import org.apache.hudi.util.ViewStorageProperties;
 import org.apache.flink.configuration.Configuration;
 import org.junit.jupiter.api.Test;
 import org.junit.jupiter.api.io.TempDir;