CodeStyle formatting to conform to basic Checkstyle rules.

The code-style rules follow Google style with some changes:
1. Increase the maximum line length from 100 to 120.
2. Disable the JavaDoc-related Checkstyle checks, as these need more manual work.
Both source and test code are checked for code style.
2018-03-20 16:29:20 -07:00
parent 987f5d6b96
commit 788e4f2d2e
200 changed files with 6209 additions and 5975 deletions
--- a/hoodie-hive/src/main/java/com/uber/hoodie/hive/HiveSyncConfig.java
+++ b/hoodie-hive/src/main/java/com/uber/hoodie/hive/HiveSyncConfig.java
@@ -48,15 +48,23 @@ public class HiveSyncConfig implements Serializable {
      "--base-path"}, description = "Basepath of hoodie dataset to sync", required = true)
  public String basePath;

-  @Parameter(names = "--partitioned-by", description = "Fields in the schema partitioned by", required = true)
+  @Parameter(names = "--partitioned-by", description = "Fields in the schema partitioned by",
+      required = true)
  public List<String> partitionFields = new ArrayList<>();

-  @Parameter(names = "-partition-value-extractor", description = "Class which implements PartitionValueExtractor to extract the partition values from HDFS path")
+  @Parameter(names = "-partition-value-extractor", description = "Class which implements "
+      + "PartitionValueExtractor "
+      + "to extract the partition "
+      + "values from HDFS path")
  public String partitionValueExtractorClass = SlashEncodedDayPartitionValueExtractor.class
      .getName();

  @Parameter(names = {
-      "--assume-date-partitioning"}, description = "Assume standard yyyy/mm/dd partitioning, this exists to support backward compatibility. If you use hoodie 0.3.x, do not set this parameter")
+      "--assume-date-partitioning"}, description = "Assume standard yyyy/mm/dd partitioning, this"
+      + " exists to support "
+      + "backward compatibility. If"
+      + " you use hoodie 0.3.x, do "
+      + "not set this parameter")
  public Boolean assumeDatePartitioning = false;

  @Parameter(names = {"--help", "-h"}, help = true)
--- a/hoodie-hive/src/main/java/com/uber/hoodie/hive/HiveSyncTool.java
+++ b/hoodie-hive/src/main/java/com/uber/hoodie/hive/HiveSyncTool.java
@@ -45,16 +45,16 @@ import parquet.schema.MessageType;
 * Tool to sync a hoodie HDFS dataset with a hive metastore table. Either use it as a api
 * HiveSyncTool.syncHoodieTable(HiveSyncConfig) or as a command line java -cp hoodie-hive.jar
 * HiveSyncTool [args]
- *
+ * <p>
 * This utility will get the schema from the latest commit and will sync hive table schema Also this
 * will sync the partitions incrementally (all the partitions modified since the last commit)
 */
@SuppressWarnings("WeakerAccess")
 public class HiveSyncTool {

-  private static Logger LOG = LoggerFactory.getLogger(HiveSyncTool.class);
+  private static final Logger LOG = LoggerFactory.getLogger(HiveSyncTool.class);
  private final HoodieHiveClient hoodieHiveClient;
-  public final static String SUFFIX_REALTIME_TABLE = "_rt";
+  public static final String SUFFIX_REALTIME_TABLE = "_rt";
  private final HiveSyncConfig cfg;

  public HiveSyncTool(HiveSyncConfig cfg, HiveConf configuration, FileSystem fs) {
@@ -85,9 +85,8 @@ public class HiveSyncTool {
  }

  private void syncHoodieTable(boolean isRealTime) {
-    LOG.info("Trying to sync hoodie table " + cfg.tableName + " with base path " + hoodieHiveClient
-        .getBasePath() + " of type " + hoodieHiveClient
-        .getTableType());
+    LOG.info("Trying to sync hoodie table " + cfg.tableName + " with base path "
+        + hoodieHiveClient.getBasePath() + " of type " + hoodieHiveClient.getTableType());

    // Check if the necessary table exists
    boolean tableExists = hoodieHiveClient.doesTableExist();
@@ -118,27 +117,29 @@ public class HiveSyncTool {
   * If not, evolves the table schema.
   *
   * @param tableExists - does table exist
-   * @param schema - extracted schema
+   * @param schema      - extracted schema
   */
  private void syncSchema(boolean tableExists, boolean isRealTime, MessageType schema) {
    // Check and sync schema
    if (!tableExists) {
      LOG.info("Table " + cfg.tableName + " is not found. Creating it");
      if (!isRealTime) {
-        // TODO - RO Table for MOR only after major compaction (UnboundedCompaction is default for now)
+        // TODO - RO Table for MOR only after major compaction (UnboundedCompaction is default
+        // for now)
        hoodieHiveClient.createTable(schema, HoodieInputFormat.class.getName(),
            MapredParquetOutputFormat.class.getName(), ParquetHiveSerDe.class.getName());
      } else {
        // Custom serde will not work with ALTER TABLE REPLACE COLUMNS
-        // https://github.com/apache/hive/blob/release-1.1.0/ql/src/java/org/apache/hadoop/hive/ql/exec/DDLTask.java#L3488
+        // https://github.com/apache/hive/blob/release-1.1.0/ql/src/java/org/apache/hadoop/hive
+        // /ql/exec/DDLTask.java#L3488
        hoodieHiveClient.createTable(schema, HoodieRealtimeInputFormat.class.getName(),
            MapredParquetOutputFormat.class.getName(), ParquetHiveSerDe.class.getName());
      }
    } else {
      // Check if the dataset schema has evolved
      Map<String, String> tableSchema = hoodieHiveClient.getTableSchema();
-      SchemaDifference schemaDiff = SchemaUtil
-          .getSchemaDifference(schema, tableSchema, cfg.partitionFields);
+      SchemaDifference schemaDiff = SchemaUtil.getSchemaDifference(schema, tableSchema,
+          cfg.partitionFields);
      if (!schemaDiff.isEmpty()) {
        LOG.info("Schema difference found for " + cfg.tableName);
        hoodieHiveClient.updateTableDefinition(schema);
@@ -156,8 +157,8 @@ public class HiveSyncTool {
  private void syncPartitions(List<String> writtenPartitionsSince) {
    try {
      List<Partition> hivePartitions = hoodieHiveClient.scanTablePartitions();
-      List<PartitionEvent> partitionEvents = hoodieHiveClient
-          .getPartitionEvents(hivePartitions, writtenPartitionsSince);
+      List<PartitionEvent> partitionEvents = hoodieHiveClient.getPartitionEvents(hivePartitions,
+          writtenPartitionsSince);
      List<String> newPartitions = filterPartitions(partitionEvents, PartitionEventType.ADD);
      LOG.info("New Partitions " + newPartitions);
      hoodieHiveClient.addPartitionsToTable(newPartitions);
@@ -165,15 +166,13 @@ public class HiveSyncTool {
      LOG.info("Changed Partitions " + updatePartitions);
      hoodieHiveClient.updatePartitionsToTable(updatePartitions);
    } catch (Exception e) {
-      throw new HoodieHiveSyncException("Failed to sync partitions for table " + cfg.tableName,
-          e);
+      throw new HoodieHiveSyncException("Failed to sync partitions for table " + cfg.tableName, e);
    }
  }

  private List<String> filterPartitions(List<PartitionEvent> events, PartitionEventType eventType) {
-    return events.stream()
-        .filter(s -> s.eventType == eventType).map(s -> s.storagePartition).collect(
-            Collectors.toList());
+    return events.stream().filter(s -> s.eventType == eventType).map(s -> s.storagePartition)
+        .collect(Collectors.toList());
  }

  public static void main(String[] args) throws Exception {
--- a/hoodie-hive/src/main/java/com/uber/hoodie/hive/HoodieHiveClient.java
+++ b/hoodie-hive/src/main/java/com/uber/hoodie/hive/HoodieHiveClient.java
@@ -15,6 +15,7 @@
 *
 *
 */
+
 package com.uber.hoodie.hive;

 import com.google.common.base.Preconditions;
@@ -25,15 +26,22 @@ import com.uber.hoodie.common.model.HoodieLogFile;
 import com.uber.hoodie.common.model.HoodieTableType;
 import com.uber.hoodie.common.table.HoodieTableMetaClient;
 import com.uber.hoodie.common.table.HoodieTimeline;
-import com.uber.hoodie.common.table.log.HoodieLogFormat;
-import com.uber.hoodie.common.table.log.HoodieLogFormat.Reader;
-import com.uber.hoodie.common.table.log.block.HoodieAvroDataBlock;
-import com.uber.hoodie.common.table.log.block.HoodieLogBlock;
 import com.uber.hoodie.common.table.timeline.HoodieInstant;
 import com.uber.hoodie.common.util.FSUtils;
 import com.uber.hoodie.exception.HoodieIOException;
 import com.uber.hoodie.exception.InvalidDatasetException;
 import com.uber.hoodie.hive.util.SchemaUtil;
+import java.io.IOException;
+import java.sql.Connection;
+import java.sql.DatabaseMetaData;
+import java.sql.ResultSet;
+import java.sql.SQLException;
+import java.sql.Statement;
+import java.util.Collections;
+import java.util.List;
+import java.util.Map;
+import java.util.Optional;
+import java.util.stream.Collectors;
 import org.apache.commons.dbcp.BasicDataSource;
 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.Path;
@@ -51,18 +59,6 @@ import parquet.hadoop.ParquetFileReader;
 import parquet.hadoop.metadata.ParquetMetadata;
 import parquet.schema.MessageType;

-import java.io.IOException;
-import java.sql.Connection;
-import java.sql.DatabaseMetaData;
-import java.sql.ResultSet;
-import java.sql.SQLException;
-import java.sql.Statement;
-import java.util.Collections;
-import java.util.List;
-import java.util.Map;
-import java.util.Optional;
-import java.util.stream.Collectors;
-
@SuppressWarnings("ConstantConditions")
 public class HoodieHiveClient {

@@ -103,16 +99,15 @@ public class HoodieHiveClient {
    }

    try {
-      this.partitionValueExtractor = (PartitionValueExtractor) Class
-          .forName(cfg.partitionValueExtractorClass).newInstance();
+      this.partitionValueExtractor = (PartitionValueExtractor) Class.forName(
+          cfg.partitionValueExtractorClass).newInstance();
    } catch (Exception e) {
      throw new HoodieHiveSyncException(
          "Failed to initialize PartitionValueExtractor class " + cfg.partitionValueExtractorClass,
          e);
    }

-    activeTimeline = metaClient.getActiveTimeline().getCommitsTimeline()
-        .filterCompletedInstants();
+    activeTimeline = metaClient.getActiveTimeline().getCommitsTimeline().filterCompletedInstants();
  }

  public HoodieTimeline getActiveTimeline() {
@@ -207,9 +202,8 @@ public class HoodieHiveClient {
    for (Partition tablePartition : tablePartitions) {
      List<String> hivePartitionValues = tablePartition.getValues();
      Collections.sort(hivePartitionValues);
-      String fullTablePartitionPath = Path
-          .getPathWithoutSchemeAndAuthority(new Path(tablePartition.getSd().getLocation())).toUri()
-          .getPath();
+      String fullTablePartitionPath = Path.getPathWithoutSchemeAndAuthority(
+          new Path(tablePartition.getSd().getLocation())).toUri().getPath();
      paths.put(String.join(", ", hivePartitionValues), fullTablePartitionPath);
    }

@@ -235,8 +229,7 @@ public class HoodieHiveClient {
   * Scan table partitions
   */
  List<Partition> scanTablePartitions() throws TException {
-    return client
-        .listPartitions(syncConfig.databaseName, syncConfig.tableName, (short) -1);
+    return client.listPartitions(syncConfig.databaseName, syncConfig.tableName, (short) -1);
  }

  void updateTableDefinition(MessageType newSchema) {
@@ -245,9 +238,10 @@ public class HoodieHiveClient {
      // Cascade clause should not be present for non-partitioned tables
      String cascadeClause = syncConfig.partitionFields.size() > 0 ? " cascade" : "";
      StringBuilder sqlBuilder = new StringBuilder("ALTER TABLE ").append("`")
-          .append(syncConfig.databaseName).append(".").append(syncConfig.tableName).append("`")
-          .append(" REPLACE COLUMNS(")
-          .append(newSchemaStr).append(" )").append(cascadeClause);
+          .append(syncConfig.databaseName).append(".")
+          .append(syncConfig.tableName).append("`")
+          .append(" REPLACE COLUMNS(").append(newSchemaStr).append(" )")
+          .append(cascadeClause);
      LOG.info("Creating table with " + sqlBuilder);
      updateHiveSQL(sqlBuilder.toString());
    } catch (IOException e) {
@@ -255,8 +249,8 @@ public class HoodieHiveClient {
    }
  }

-  void createTable(MessageType storageSchema,
-      String inputFormatClass, String outputFormatClass, String serdeClass) {
+  void createTable(MessageType storageSchema, String inputFormatClass, String outputFormatClass,
+      String serdeClass) {
    try {
      String createSQLQuery = SchemaUtil
          .generateCreateDDL(storageSchema, syncConfig, inputFormatClass,
@@ -289,8 +283,8 @@ public class HoodieHiveClient {
      }
      return schema;
    } catch (SQLException e) {
-      throw new HoodieHiveSyncException(
-          "Failed to get table schema for " + syncConfig.tableName, e);
+      throw new HoodieHiveSyncException("Failed to get table schema for " + syncConfig.tableName,
+          e);
    } finally {
      closeQuietly(result, null);
    }
@@ -308,49 +302,47 @@ public class HoodieHiveClient {
    try {
      switch (tableType) {
        case COPY_ON_WRITE:
-          // If this is COW, get the last commit and read the schema from a file written in the last commit
-          HoodieInstant lastCommit = activeTimeline.lastInstant()
-              .orElseThrow(() -> new InvalidDatasetException(syncConfig.basePath));
-          HoodieCommitMetadata commitMetadata = HoodieCommitMetadata
-              .fromBytes(activeTimeline.getInstantDetails(lastCommit).get());
+          // If this is COW, get the last commit and read the schema from a file written in the
+          // last commit
+          HoodieInstant lastCommit = activeTimeline.lastInstant().orElseThrow(
+              () -> new InvalidDatasetException(syncConfig.basePath));
+          HoodieCommitMetadata commitMetadata = HoodieCommitMetadata.fromBytes(
+              activeTimeline.getInstantDetails(lastCommit).get());
          String filePath = commitMetadata.getFileIdAndFullPaths(metaClient.getBasePath()).values()
-              .stream().findAny()
-              .orElseThrow(() -> new IllegalArgumentException(
+              .stream().findAny().orElseThrow(() -> new IllegalArgumentException(
                  "Could not find any data file written for commit " + lastCommit
                      + ", could not get schema for dataset " + metaClient.getBasePath()));
          return readSchemaFromDataFile(new Path(filePath));
        case MERGE_ON_READ:
-          // If this is MOR, depending on whether the latest commit is a delta commit or compaction commit
+          // If this is MOR, depending on whether the latest commit is a delta commit or
+          // compaction commit
          // Get a datafile written and get the schema from that file
          Optional<HoodieInstant> lastCompactionCommit = metaClient.getActiveTimeline()
-              .getCommitTimeline().filterCompletedInstants().lastInstant();
+              .getCommitTimeline()
+              .filterCompletedInstants()
+              .lastInstant();
          LOG.info("Found the last compaction commit as " + lastCompactionCommit);

          Optional<HoodieInstant> lastDeltaCommit;
          if (lastCompactionCommit.isPresent()) {
-            lastDeltaCommit = metaClient.getActiveTimeline()
-                .getDeltaCommitTimeline()
+            lastDeltaCommit = metaClient.getActiveTimeline().getDeltaCommitTimeline()
                .filterCompletedInstants()
-                .findInstantsAfter(lastCompactionCommit.get().getTimestamp(), Integer.MAX_VALUE)
-                .lastInstant();
+                .findInstantsAfter(lastCompactionCommit.get().getTimestamp(),
+                    Integer.MAX_VALUE).lastInstant();
          } else {
-            lastDeltaCommit = metaClient.getActiveTimeline()
-                    .getDeltaCommitTimeline()
-                    .filterCompletedInstants()
-                    .lastInstant();
+            lastDeltaCommit = metaClient.getActiveTimeline().getDeltaCommitTimeline()
+                .filterCompletedInstants().lastInstant();
          }
-          LOG.info("Found the last delta commit "
-              + lastDeltaCommit);
+          LOG.info("Found the last delta commit " + lastDeltaCommit);

          if (lastDeltaCommit.isPresent()) {
            HoodieInstant lastDeltaInstant = lastDeltaCommit.get();
            // read from the log file wrote
-            commitMetadata = HoodieCommitMetadata
-                .fromBytes(activeTimeline.getInstantDetails(lastDeltaInstant).get());
+            commitMetadata = HoodieCommitMetadata.fromBytes(
+                activeTimeline.getInstantDetails(lastDeltaInstant).get());
            filePath = commitMetadata.getFileIdAndFullPaths(metaClient.getBasePath()).values()
-                .stream().filter(s -> s.contains(
-                    HoodieLogFile.DELTA_EXTENSION)).findAny()
-                .orElseThrow(() -> new IllegalArgumentException(
+                .stream().filter(s -> s.contains(HoodieLogFile.DELTA_EXTENSION))
+                .findAny().orElseThrow(() -> new IllegalArgumentException(
                    "Could not find any data file written for commit " + lastDeltaInstant
                        + ", could not get schema for dataset " + metaClient.getBasePath()));
            return readSchemaFromLogFile(lastCompactionCommit, new Path(filePath));
@@ -362,8 +354,8 @@ public class HoodieHiveClient {
          throw new InvalidDatasetException(syncConfig.basePath);
      }
    } catch (IOException e) {
-      throw new HoodieHiveSyncException(
-          "Failed to get dataset schema for " + syncConfig.tableName, e);
+      throw new HoodieHiveSyncException("Failed to get dataset schema for " + syncConfig.tableName,
+          e);
    }
  }

@@ -379,11 +371,10 @@ public class HoodieHiveClient {
                + syncConfig.basePath));

    // Read from the compacted file wrote
-    HoodieCommitMetadata compactionMetadata = HoodieCommitMetadata
-        .fromBytes(activeTimeline.getInstantDetails(lastCompactionCommit).get());
+    HoodieCommitMetadata compactionMetadata = HoodieCommitMetadata.fromBytes(
+        activeTimeline.getInstantDetails(lastCompactionCommit).get());
    String filePath = compactionMetadata.getFileIdAndFullPaths(metaClient.getBasePath()).values()
-        .stream().findAny()
-        .orElseThrow(() -> new IllegalArgumentException(
+        .stream().findAny().orElseThrow(() -> new IllegalArgumentException(
            "Could not find any data file written for compaction " + lastCompactionCommit
                + ", could not get schema for dataset " + metaClient.getBasePath()));
    return readSchemaFromDataFile(new Path(filePath));
@@ -411,12 +402,10 @@ public class HoodieHiveClient {
    LOG.info("Reading schema from " + parquetFilePath);
    if (!fs.exists(parquetFilePath)) {
      throw new IllegalArgumentException(
-          "Failed to read schema from data file " + parquetFilePath
-              + ". File does not exist.");
+          "Failed to read schema from data file " + parquetFilePath + ". File does not exist.");
    }
-    ParquetMetadata fileFooter =
-        ParquetFileReader
-            .readFooter(fs.getConf(), parquetFilePath, ParquetMetadataConverter.NO_FILTER);
+    ParquetMetadata fileFooter = ParquetFileReader.readFooter(fs.getConf(), parquetFilePath,
+        ParquetMetadataConverter.NO_FILTER);
    return fileFooter.getFileMetaData().getSchema();
  }

@@ -427,8 +416,8 @@ public class HoodieHiveClient {
    try {
      return client.tableExists(syncConfig.databaseName, syncConfig.tableName);
    } catch (TException e) {
-      throw new HoodieHiveSyncException(
-          "Failed to check if table exists " + syncConfig.tableName, e);
+      throw new HoodieHiveSyncException("Failed to check if table exists " + syncConfig.tableName,
+          e);
    }
  }

@@ -511,8 +500,8 @@ public class HoodieHiveClient {
    // Get the last commit time from the TBLproperties
    try {
      Table database = client.getTable(syncConfig.databaseName, syncConfig.tableName);
-      return Optional
-          .ofNullable(database.getParameters().getOrDefault(HOODIE_LAST_COMMIT_TIME_SYNC, null));
+      return Optional.ofNullable(
+          database.getParameters().getOrDefault(HOODIE_LAST_COMMIT_TIME_SYNC, null));
    } catch (Exception e) {
      throw new HoodieHiveSyncException(
          "Failed to get the last commit time synced from the database", e);
@@ -537,8 +526,8 @@ public class HoodieHiveClient {
    if (!lastCommitTimeSynced.isPresent()) {
      LOG.info("Last commit time synced is not known, listing all partitions");
      try {
-        return FSUtils
-            .getAllPartitionPaths(fs, syncConfig.basePath, syncConfig.assumeDatePartitioning);
+        return FSUtils.getAllPartitionPaths(fs, syncConfig.basePath,
+            syncConfig.assumeDatePartitioning);
      } catch (IOException e) {
        throw new HoodieIOException("Failed to list all partitions in " + syncConfig.basePath, e);
      }
@@ -546,8 +535,8 @@ public class HoodieHiveClient {
      LOG.info("Last commit time synced is " + lastCommitTimeSynced.get()
          + ", Getting commits since then");

-      HoodieTimeline timelineToSync = activeTimeline
-          .findInstantsAfter(lastCommitTimeSynced.get(), Integer.MAX_VALUE);
+      HoodieTimeline timelineToSync = activeTimeline.findInstantsAfter(lastCommitTimeSynced.get(),
+          Integer.MAX_VALUE);
      return timelineToSync.getInstants().map(s -> {
        try {
          return HoodieCommitMetadata.fromBytes(activeTimeline.getInstantDetails(s).get());
@@ -579,13 +568,15 @@ public class HoodieHiveClient {
   */
  static class PartitionEvent {

-    public enum PartitionEventType {ADD, UPDATE}
+    public enum PartitionEventType {
+      ADD,
+      UPDATE
+    }

    PartitionEventType eventType;
    String storagePartition;

-    PartitionEvent(
-        PartitionEventType eventType, String storagePartition) {
+    PartitionEvent(PartitionEventType eventType, String storagePartition) {
      this.eventType = eventType;
      this.storagePartition = storagePartition;
    }
--- a/hoodie-hive/src/main/java/com/uber/hoodie/hive/PartitionValueExtractor.java
+++ b/hoodie-hive/src/main/java/com/uber/hoodie/hive/PartitionValueExtractor.java
@@ -24,8 +24,9 @@ import java.util.List;
 * HDFS Path contain hive partition values for the keys it is partitioned on. This mapping is not
 * straight forward and requires a pluggable implementation to extract the partition value from HDFS
 * path.
- *
- * e.g. Hive table partitioned by datestr=yyyy-mm-dd and hdfs path /app/hoodie/dataset1/YYYY=[yyyy]/MM=[mm]/DD=[dd]
+ * <p>
+ * e.g. Hive table partitioned by datestr=yyyy-mm-dd and hdfs path
+ * /app/hoodie/dataset1/YYYY=[yyyy]/MM=[mm]/DD=[dd]
 */
 public interface PartitionValueExtractor {

--- a/hoodie-hive/src/main/java/com/uber/hoodie/hive/SlashEncodedDayPartitionValueExtractor.java
+++ b/hoodie-hive/src/main/java/com/uber/hoodie/hive/SlashEncodedDayPartitionValueExtractor.java
@@ -28,7 +28,7 @@ import org.joda.time.format.DateTimeFormatter;
 * HDFS Path contain hive partition values for the keys it is partitioned on. This mapping is not
 * straight forward and requires a pluggable implementation to extract the partition value from HDFS
 * path.
- *
+ * <p>
 * This implementation extracts datestr=yyyy-mm-dd from path of type /yyyy/mm/dd
 */
 public class SlashEncodedDayPartitionValueExtractor implements PartitionValueExtractor {
--- a/hoodie-hive/src/main/java/com/uber/hoodie/hive/util/ColumnNameXLator.java
+++ b/hoodie-hive/src/main/java/com/uber/hoodie/hive/util/ColumnNameXLator.java
@@ -26,9 +26,9 @@ public class ColumnNameXLator {

  public static String translateNestedColumn(String colName) {
    Map.Entry entry;
-    for (Iterator i$ = xformMap.entrySet().iterator(); i$.hasNext();
+    for (Iterator ic = xformMap.entrySet().iterator(); ic.hasNext();
        colName = colName.replaceAll((String) entry.getKey(), (String) entry.getValue())) {
-      entry = (Map.Entry) i$.next();
+      entry = (Map.Entry) ic.next();
    }

    return colName;
--- a/hoodie-hive/src/main/java/com/uber/hoodie/hive/util/SchemaUtil.java
+++ b/hoodie-hive/src/main/java/com/uber/hoodie/hive/util/SchemaUtil.java
@@ -23,14 +23,12 @@ import com.uber.hoodie.common.table.log.HoodieLogFormat;
 import com.uber.hoodie.common.table.log.HoodieLogFormat.Reader;
 import com.uber.hoodie.common.table.log.block.HoodieAvroDataBlock;
 import com.uber.hoodie.common.table.log.block.HoodieLogBlock;
-import com.uber.hoodie.common.table.timeline.HoodieInstant;
 import com.uber.hoodie.hive.HiveSyncConfig;
 import com.uber.hoodie.hive.HoodieHiveSyncException;
 import com.uber.hoodie.hive.SchemaDifference;
 import java.io.IOException;
 import java.util.List;
 import java.util.Map;
-import java.util.Optional;
 import java.util.Set;
 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.Path;
@@ -48,7 +46,7 @@ import parquet.schema.Type;
 */
 public class SchemaUtil {

-  private static Logger LOG = LoggerFactory.getLogger(SchemaUtil.class);
+  private static final Logger LOG = LoggerFactory.getLogger(SchemaUtil.class);

  /**
   * Get the schema difference between the storage schema and hive table schema
@@ -59,19 +57,19 @@ public class SchemaUtil {
    try {
      newTableSchema = convertParquetSchemaToHiveSchema(storageSchema);
    } catch (IOException e) {
-      throw new HoodieHiveSyncException("Failed to convert parquet schema to hive schema",
-          e);
+      throw new HoodieHiveSyncException("Failed to convert parquet schema to hive schema", e);
    }
    LOG.info("Getting schema difference for " + tableSchema + "\r\n\r\n" + newTableSchema);
-    SchemaDifference.Builder schemaDiffBuilder =
-        SchemaDifference.newBuilder(storageSchema, tableSchema);
+    SchemaDifference.Builder schemaDiffBuilder = SchemaDifference
+        .newBuilder(storageSchema, tableSchema);
    Set<String> tableColumns = Sets.newHashSet();

    for (Map.Entry<String, String> field : tableSchema.entrySet()) {
      String fieldName = field.getKey().toLowerCase();
      String tickSurroundedFieldName = tickSurround(fieldName);
      if (!isFieldExistsInSchema(newTableSchema, tickSurroundedFieldName) && !partitionKeys
-          .contains(fieldName)) {
+          .contains(
+              fieldName)) {
        schemaDiffBuilder.deleteTableColumn(fieldName);
      } else {
        // check type
@@ -82,8 +80,8 @@ public class SchemaUtil {
            continue;
          }
          // We will log this and continue. Hive schema is a superset of all parquet schemas
-          LOG.warn("Ignoring table column " + fieldName
-              + " as its not present in the parquet schema");
+          LOG.warn(
+              "Ignoring table column " + fieldName + " as its not present in the parquet schema");
          continue;
        }
        tableColumnType = tableColumnType.replaceAll("\\s+", "");
@@ -93,11 +91,12 @@ public class SchemaUtil {
        expectedType = expectedType.replaceAll("`", "");

        if (!tableColumnType.equalsIgnoreCase(expectedType)) {
-          // check for incremental datasets, the schema type change is allowed as per evolution rules
+          // check for incremental datasets, the schema type change is allowed as per evolution
+          // rules
          if (!isSchemaTypeUpdateAllowed(tableColumnType, expectedType)) {
            throw new HoodieHiveSyncException(
-                "Could not convert field Type from " + tableColumnType + " to "
-                    + expectedType + " for field " + fieldName);
+                "Could not convert field Type from " + tableColumnType + " to " + expectedType
+                    + " for field " + fieldName);
          }
          schemaDiffBuilder.updateTableColumn(fieldName,
              getExpectedType(newTableSchema, tickSurroundedFieldName));
@@ -169,21 +168,19 @@ public class SchemaUtil {
  private static String convertField(final Type parquetType) {
    StringBuilder field = new StringBuilder();
    if (parquetType.isPrimitive()) {
-      final PrimitiveType.PrimitiveTypeName parquetPrimitiveTypeName =
-          parquetType.asPrimitiveType().getPrimitiveTypeName();
+      final PrimitiveType.PrimitiveTypeName parquetPrimitiveTypeName = parquetType.asPrimitiveType()
+          .getPrimitiveTypeName();
      final OriginalType originalType = parquetType.getOriginalType();
      if (originalType == OriginalType.DECIMAL) {
-        final DecimalMetadata decimalMetadata =
-            parquetType.asPrimitiveType().getDecimalMetadata();
-        return field.append("DECIMAL(").append(decimalMetadata.getPrecision()).
-            append(" , ").append(decimalMetadata.getScale()).append(")").toString();
+        final DecimalMetadata decimalMetadata = parquetType.asPrimitiveType().getDecimalMetadata();
+        return field.append("DECIMAL(").append(decimalMetadata.getPrecision()).append(" , ")
+            .append(decimalMetadata.getScale()).append(")").toString();
      }
      // TODO - fix the method naming here
      return parquetPrimitiveTypeName
          .convert(new PrimitiveType.PrimitiveTypeNameConverter<String, RuntimeException>() {
            @Override
-            public String convertBOOLEAN(
-                PrimitiveType.PrimitiveTypeName primitiveTypeName) {
+            public String convertBOOLEAN(PrimitiveType.PrimitiveTypeName primitiveTypeName) {
              return "boolean";
            }

@@ -220,8 +217,7 @@ public class SchemaUtil {

            @Override
            public String convertBINARY(PrimitiveType.PrimitiveTypeName primitiveTypeName) {
-              if (originalType == OriginalType.UTF8
-                  || originalType == OriginalType.ENUM) {
+              if (originalType == OriginalType.UTF8 || originalType == OriginalType.ENUM) {
                return "string";
              } else {
                return "binary";
@@ -235,33 +231,28 @@ public class SchemaUtil {
        switch (originalType) {
          case LIST:
            if (parquetGroupType.getFieldCount() != 1) {
-              throw new UnsupportedOperationException(
-                  "Invalid list type " + parquetGroupType);
+              throw new UnsupportedOperationException("Invalid list type " + parquetGroupType);
            }
            Type elementType = parquetGroupType.getType(0);
            if (!elementType.isRepetition(Type.Repetition.REPEATED)) {
-              throw new UnsupportedOperationException(
-                  "Invalid list type " + parquetGroupType);
+              throw new UnsupportedOperationException("Invalid list type " + parquetGroupType);
            }
            return createHiveArray(elementType, parquetGroupType.getName());
          case MAP:
            if (parquetGroupType.getFieldCount() != 1 || parquetGroupType.getType(0)
                .isPrimitive()) {
-              throw new UnsupportedOperationException(
-                  "Invalid map type " + parquetGroupType);
+              throw new UnsupportedOperationException("Invalid map type " + parquetGroupType);
            }
            GroupType mapKeyValType = parquetGroupType.getType(0).asGroupType();
-            if (!mapKeyValType.isRepetition(Type.Repetition.REPEATED) ||
-                !mapKeyValType.getOriginalType().equals(OriginalType.MAP_KEY_VALUE) ||
-                mapKeyValType.getFieldCount() != 2) {
-              throw new UnsupportedOperationException(
-                  "Invalid map type " + parquetGroupType);
+            if (!mapKeyValType.isRepetition(Type.Repetition.REPEATED)
+                || !mapKeyValType.getOriginalType().equals(OriginalType.MAP_KEY_VALUE)
+                || mapKeyValType.getFieldCount() != 2) {
+              throw new UnsupportedOperationException("Invalid map type " + parquetGroupType);
            }
            Type keyType = mapKeyValType.getType(0);
-            if (!keyType.isPrimitive() ||
-                !keyType.asPrimitiveType().getPrimitiveTypeName()
-                    .equals(PrimitiveType.PrimitiveTypeName.BINARY) ||
-                !keyType.getOriginalType().equals(OriginalType.UTF8)) {
+            if (!keyType.isPrimitive() || !keyType.asPrimitiveType().getPrimitiveTypeName()
+                .equals(PrimitiveType.PrimitiveTypeName.BINARY)
+                || !keyType.getOriginalType().equals(OriginalType.UTF8)) {
              throw new UnsupportedOperationException(
                  "Map key type must be binary (UTF8): " + keyType);
            }
@@ -277,8 +268,7 @@ public class SchemaUtil {
            // MAP. Hence, PARQUET-113
            // dropped the requirement for having MAP_KEY_VALUE.
          default:
-            throw new UnsupportedOperationException(
-                "Cannot convert Parquet type " + parquetType);
+            throw new UnsupportedOperationException("Cannot convert Parquet type " + parquetType);
        }
      } else {
        // if no original type then it's a record
@@ -306,7 +296,8 @@ public class SchemaUtil {
    // ", "
    struct.append(">");
    String finalStr = struct.toString();
-    // Struct cannot have - in them. userstore_udr_entities has uuid in struct. This breaks the schema.
+    // Struct cannot have - in them. userstore_udr_entities has uuid in struct. This breaks the
+    // schema.
    // HDrone sync should not fail because of this.
    finalStr = finalStr.replaceAll("-", "_");
    return finalStr;
@@ -362,8 +353,8 @@ public class SchemaUtil {
  }

  public static boolean isSchemaTypeUpdateAllowed(String prevType, String newType) {
-    if (prevType == null || prevType.trim().isEmpty() ||
-        newType == null || newType.trim().isEmpty()) {
+    if (prevType == null || prevType.trim().isEmpty() || newType == null || newType.trim()
+        .isEmpty()) {
      return false;
    }
    prevType = prevType.toLowerCase();
@@ -392,9 +383,8 @@ public class SchemaUtil {
    return columns.toString();
  }

-  public static String generateCreateDDL(MessageType storageSchema,
-      HiveSyncConfig config, String inputFormatClass,
-      String outputFormatClass, String serdeClass) throws IOException {
+  public static String generateCreateDDL(MessageType storageSchema, HiveSyncConfig config,
+      String inputFormatClass, String outputFormatClass, String serdeClass) throws IOException {
    Map<String, String> hiveSchema = convertParquetSchemaToHiveSchema(storageSchema);
    String columns = generateSchemaString(storageSchema);

@@ -422,7 +412,8 @@ public class SchemaUtil {
      return hiveSchema.get(partitionKey);
    }
    // Default the unknown partition fields to be String
-    // TODO - all partition fields should be part of the schema. datestr is treated as special. Dont do that
+    // TODO - all partition fields should be part of the schema. datestr is treated as special.
+    // Dont do that
    return "String";
  }

@@ -430,8 +421,7 @@ public class SchemaUtil {
   * Read the schema from the log file on path
   */
  @SuppressWarnings("OptionalUsedAsFieldOrParameterType")
-  public static MessageType readSchemaFromLogFile(FileSystem fs,
-      Path path) throws IOException {
+  public static MessageType readSchemaFromLogFile(FileSystem fs, Path path) throws IOException {
    Reader reader = HoodieLogFormat.newReader(fs, new HoodieLogFile(path), null);
    HoodieAvroDataBlock lastBlock = null;
    while (reader.hasNext()) {