
Code-style formatting to conform to basic Checkstyle rules.

The code-style rules largely follow the Google Java style, with a few changes:

1. Increase the maximum line length from 100 to 120 characters.
2. Disable the Javadoc-related Checkstyle checks, since those need more manual work.

Both source and test code are checked for code style.
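For illustration, a minimal Checkstyle configuration capturing the two deviations above might look like the sketch below. This is an assumption for clarity, not the actual file added by this commit (the updated docs point at the repo's style/ directory for the real one), and module placement for LineLength varies across Checkstyle versions.

```xml
<?xml version="1.0"?>
<!DOCTYPE module PUBLIC
    "-//Checkstyle//DTD Checkstyle Configuration 1.3//EN"
    "https://checkstyle.org/dtds/configuration_1_3.dtd">
<!-- Hypothetical Google-style-based config with the deviations listed above. -->
<module name="Checker">
  <module name="TreeWalker">
    <!-- Change 1: raise the Google default of 100 columns to 120.
         (Newer Checkstyle releases expect LineLength directly under Checker.) -->
    <module name="LineLength">
      <property name="max" value="120"/>
    </module>
    <!-- Change 2: Javadoc checks (e.g. JavadocMethod, JavadocType) are intentionally
         left out until the Javadoc cleanup can be done manually. -->
  </module>
</module>
```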
Authored by Balaji Varadarajan on 2018-03-20 16:29:20 -07:00
Committed by vinoth chandar
Parent 987f5d6b96
Commit 788e4f2d2e
200 changed files with 6209 additions and 5975 deletions
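The dev_setup change below notes that the Maven compilation life-cycle fails on Checkstyle violations and that both source and test code are covered. A hedged sketch of how such a check is commonly bound in a pom.xml with maven-checkstyle-plugin follows; the configLocation path and the chosen phase are assumptions, not taken from this repository's build.

```xml
<plugin>
  <groupId>org.apache.maven.plugins</groupId>
  <artifactId>maven-checkstyle-plugin</artifactId>
  <configuration>
    <!-- Assumed path; the docs below point IDE users at the repo's style/ directory. -->
    <configLocation>style/checkstyle.xml</configLocation>
    <!-- Check test sources too, matching "both source and test code are checked". -->
    <includeTestSourceDirectory>true</includeTestSourceDirectory>
    <failOnViolation>true</failOnViolation>
  </configuration>
  <executions>
    <execution>
      <!-- Binding the check to an early phase makes the build fail on violations
           before compilation completes. -->
      <phase>validate</phase>
      <goals>
        <goal>check</goal>
      </goals>
    </execution>
  </executions>
</plugin>
```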

View File

@@ -7,8 +7,7 @@ permalink: dev_setup.html
### Code Style
We have embraced the [Google Java code style](https://google.github.io/styleguide/javaguide.html). Please setup your IDE accordingly with style files from [here](https://github.com/google/styleguide/blob/gh-pages/intellij-java-google-style.xml)
Also recommend setting up the [Save Action Plugin](https://plugins.jetbrains.com/plugin/7642-save-actions) to auto format & organize imports on save.
We have embraced the code style largely based on [google format](https://google.github.io/styleguide/javaguide.html).
Please setup your IDE with style files from [here](../style/)
We also recommend setting up the [Save Action Plugin](https://plugins.jetbrains.com/plugin/7642-save-actions) to auto format & organize imports on save.
The Maven Compilation life-cycle will fail if there are checkstyle violations.

View File

@@ -35,11 +35,11 @@ public class HoodiePrompt extends DefaultPromptProvider {
case DATASET:
return "hoodie:" + tableName + "->";
case SYNC:
return "hoodie:" + tableName + " <==> "
+ HoodieCLI.syncTableMetadata.getTableConfig().getTableName() + "->";
}
return "hoodie:" + tableName + " <==> " + HoodieCLI.syncTableMetadata.getTableConfig().getTableName() + "->";
default:
return "hoodie:" + tableName + "->";
}
}
return "hoodie->";
}

View File

@@ -24,22 +24,18 @@ import org.springframework.stereotype.Component;
@Component
@Order(Ordered.HIGHEST_PRECEDENCE)
public class HoodieSplashScreen
extends DefaultBannerProvider {
public class HoodieSplashScreen extends DefaultBannerProvider {
private static String screen =
"============================================" + OsUtils.LINE_SEPARATOR +
"* *" + OsUtils.LINE_SEPARATOR +
"* _ _ _ _ *" + OsUtils.LINE_SEPARATOR +
"* | | | | | (_) *" + OsUtils.LINE_SEPARATOR +
"* | |__| | ___ ___ __| |_ ___ *" + OsUtils.LINE_SEPARATOR +
"* | __ |/ _ \\ / _ \\ / _` | |/ _ \\ *" +
OsUtils.LINE_SEPARATOR +
"* | | | | (_) | (_) | (_| | | __/ *" + OsUtils.LINE_SEPARATOR +
"* |_| |_|\\___/ \\___/ \\__,_|_|\\___| *" +
OsUtils.LINE_SEPARATOR +
"* *" + OsUtils.LINE_SEPARATOR +
"============================================" + OsUtils.LINE_SEPARATOR;
private static String screen = "============================================" + OsUtils.LINE_SEPARATOR
+ "* *" + OsUtils.LINE_SEPARATOR
+ "* _ _ _ _ *" + OsUtils.LINE_SEPARATOR
+ "* | | | | | (_) *" + OsUtils.LINE_SEPARATOR
+ "* | |__| | ___ ___ __| |_ ___ *" + OsUtils.LINE_SEPARATOR
+ "* | __ |/ _ \\ / _ \\ / _` | |/ _ \\ *" + OsUtils.LINE_SEPARATOR
+ "* | | | | (_) | (_) | (_| | | __/ *" + OsUtils.LINE_SEPARATOR
+ "* |_| |_|\\___/ \\___/ \\__,_|_|\\___| *" + OsUtils.LINE_SEPARATOR
+ "* *" + OsUtils.LINE_SEPARATOR
+ "============================================" + OsUtils.LINE_SEPARATOR;
public String getBanner() {
return screen;

View File

@@ -22,8 +22,7 @@ import org.springframework.shell.Bootstrap;
public class Main {
/**
* Main class that delegates to Spring Shell's Bootstrap class in order to simplify debugging
* inside an IDE
* Main class that delegates to Spring Shell's Bootstrap class in order to simplify debugging inside an IDE
*/
public static void main(String[] args) throws IOException {
Bootstrap.main(args);

View File

@@ -47,13 +47,11 @@ public class ArchivedCommitsCommand implements CommandMarker {
}
@CliCommand(value = "show archived commits", help = "Read commits from archived files and show details")
public String showCommits(
@CliOption(key = {
"limit"}, mandatory = false, help = "Limit commits", unspecifiedDefaultValue = "10")
final Integer limit) throws IOException {
public String showCommits(@CliOption(key = {
"limit"}, mandatory = false, help = "Limit commits", unspecifiedDefaultValue = "10") final Integer limit)
throws IOException {
System.out
.println("===============> Showing only " + limit + " archived commits <===============");
System.out.println("===============> Showing only " + limit + " archived commits <===============");
String basePath = HoodieCLI.tableMetadata.getBasePath();
FileStatus[] fsStatuses = FSUtils.getFs(basePath, HoodieCLI.conf)
.globStatus(new Path(basePath + "/.hoodie/.commits_.archive*"));
@@ -61,8 +59,7 @@ public class ArchivedCommitsCommand implements CommandMarker {
int commits = 0;
for (FileStatus fs : fsStatuses) {
//read the archived file
HoodieLogFormat.Reader reader = HoodieLogFormat
.newReader(FSUtils.getFs(basePath, HoodieCLI.conf),
HoodieLogFormat.Reader reader = HoodieLogFormat.newReader(FSUtils.getFs(basePath, HoodieCLI.conf),
new HoodieLogFile(fs.getPath()), HoodieArchivedMetaEntry.getClassSchema());
List<IndexedRecord> readRecords = new ArrayList<>();
@@ -76,15 +73,14 @@ public class ArchivedCommitsCommand implements CommandMarker {
}
commits++;
}
List<String[]> readCommits = readRecords.stream().map(r -> (GenericRecord) r)
.map(r -> readCommit(r)).collect(Collectors.toList());
List<String[]> readCommits = readRecords.stream().map(r -> (GenericRecord) r).map(r -> readCommit(r))
.collect(Collectors.toList());
allCommits.addAll(readCommits);
if (commits == limit) {
break;
}
}
return HoodiePrintHelper.print(
new String[]{"CommitTime", "CommitType", "CommitDetails"},
return HoodiePrintHelper.print(new String[] {"CommitTime", "CommitType", "CommitDetails"},
allCommits.toArray(new String[allCommits.size()][]));
}
@@ -122,6 +118,8 @@ public class ArchivedCommitsCommand implements CommandMarker {
commitDetails.add(record.get("hoodieSavePointMetadata").toString());
break;
}
default:
return commitDetails.toArray(new String[commitDetails.size()]);
}
} catch (Exception e) {
e.printStackTrace();

View File

@@ -13,6 +13,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.uber.hoodie.cli.commands;
import com.uber.hoodie.avro.model.HoodieCleanMetadata;
@@ -63,42 +64,37 @@ public class CleansCommand implements CommandMarker {
Collections.reverse(cleans);
for (int i = 0; i < cleans.size(); i++) {
HoodieInstant clean = cleans.get(i);
HoodieCleanMetadata cleanMetadata =
AvroUtils.deserializeHoodieCleanMetadata(timeline.getInstantDetails(clean).get());
HoodieCleanMetadata cleanMetadata = AvroUtils
.deserializeHoodieCleanMetadata(timeline.getInstantDetails(clean).get());
rows[i] = new String[] {clean.getTimestamp(), cleanMetadata.getEarliestCommitToRetain(),
String.valueOf(cleanMetadata.getTotalFilesDeleted()),
String.valueOf(cleanMetadata.getTimeTakenInMillis())};
String.valueOf(cleanMetadata.getTotalFilesDeleted()), String.valueOf(cleanMetadata.getTimeTakenInMillis())};
}
return HoodiePrintHelper.print(
new String[]{"CleanTime", "EarliestCommandRetained", "Total Files Deleted",
"Total Time Taken"}, rows);
return HoodiePrintHelper
.print(new String[] {"CleanTime", "EarliestCommandRetained", "Total Files Deleted", "Total Time Taken"},
rows);
}
@CliCommand(value = "cleans refresh", help = "Refresh the commits")
public String refreshCleans() throws IOException {
HoodieTableMetaClient metadata =
new HoodieTableMetaClient(HoodieCLI.conf, HoodieCLI.tableMetadata.getBasePath());
HoodieTableMetaClient metadata = new HoodieTableMetaClient(HoodieCLI.conf, HoodieCLI.tableMetadata.getBasePath());
HoodieCLI.setTableMetadata(metadata);
return "Metadata for table " + metadata.getTableConfig().getTableName() + " refreshed.";
}
@CliCommand(value = "clean showpartitions", help = "Show partition level details of a clean")
public String showCleanPartitions(
@CliOption(key = {"clean"}, help = "clean to show")
final String commitTime) throws Exception {
public String showCleanPartitions(@CliOption(key = {"clean"}, help = "clean to show") final String commitTime)
throws Exception {
HoodieActiveTimeline activeTimeline = HoodieCLI.tableMetadata.getActiveTimeline();
HoodieTimeline timeline = activeTimeline.getCleanerTimeline().filterCompletedInstants();
HoodieInstant cleanInstant =
new HoodieInstant(false, HoodieTimeline.CLEAN_ACTION, commitTime);
HoodieInstant cleanInstant = new HoodieInstant(false, HoodieTimeline.CLEAN_ACTION, commitTime);
if (!timeline.containsInstant(cleanInstant)) {
return "Clean " + commitTime + " not found in metadata " + timeline;
}
HoodieCleanMetadata cleanMetadata =
AvroUtils.deserializeHoodieCleanMetadata(timeline.getInstantDetails(cleanInstant).get());
HoodieCleanMetadata cleanMetadata = AvroUtils.deserializeHoodieCleanMetadata(
timeline.getInstantDetails(cleanInstant).get());
List<String[]> rows = new ArrayList<>();
for (Map.Entry<String, HoodieCleanPartitionMetadata> entry : cleanMetadata
.getPartitionMetadata().entrySet()) {
for (Map.Entry<String, HoodieCleanPartitionMetadata> entry : cleanMetadata.getPartitionMetadata().entrySet()) {
String path = entry.getKey();
HoodieCleanPartitionMetadata stats = entry.getValue();
String policy = stats.getPolicy();

View File

@@ -64,20 +64,17 @@ public class CommitsCommand implements CommandMarker {
}
@CliCommand(value = "commits show", help = "Show the commits")
public String showCommits(
@CliOption(key = {
"limit"}, mandatory = false, help = "Limit commits", unspecifiedDefaultValue = "10")
final Integer limit) throws IOException {
public String showCommits(@CliOption(key = {
"limit"}, mandatory = false, help = "Limit commits", unspecifiedDefaultValue = "10") final Integer limit)
throws IOException {
HoodieActiveTimeline activeTimeline = HoodieCLI.tableMetadata.getActiveTimeline();
HoodieTimeline timeline = activeTimeline.getCommitsTimeline()
.filterCompletedInstants();
HoodieTimeline timeline = activeTimeline.getCommitsTimeline().filterCompletedInstants();
List<HoodieInstant> commits = timeline.getInstants().collect(Collectors.toList());
String[][] rows = new String[commits.size()][];
Collections.reverse(commits);
for (int i = 0; i < commits.size(); i++) {
HoodieInstant commit = commits.get(i);
HoodieCommitMetadata commitMetadata =
HoodieCommitMetadata.fromBytes(timeline.getInstantDetails(commit).get());
HoodieCommitMetadata commitMetadata = HoodieCommitMetadata.fromBytes(timeline.getInstantDetails(commit).get());
rows[i] = new String[] {commit.getTimestamp(),
NumericUtils.humanReadableByteCount(commitMetadata.fetchTotalBytesWritten()),
String.valueOf(commitMetadata.fetchTotalFilesInsert()),
@@ -88,39 +85,32 @@ public class CommitsCommand implements CommandMarker {
String.valueOf(commitMetadata.fetchTotalWriteErrors())};
}
return HoodiePrintHelper.print(
new String[]{"CommitTime", "Total Written (B)", "Total Files Added",
"Total Files Updated", "Total Partitions Written", "Total Records Written",
"Total Update Records Written", "Total Errors"}, rows);
new String[] {"CommitTime", "Total Written (B)", "Total Files Added", "Total Files Updated",
"Total Partitions Written", "Total Records Written", "Total Update Records Written", "Total Errors"}, rows);
}
@CliCommand(value = "commits refresh", help = "Refresh the commits")
public String refreshCommits() throws IOException {
HoodieTableMetaClient metadata =
new HoodieTableMetaClient(HoodieCLI.conf, HoodieCLI.tableMetadata.getBasePath());
HoodieTableMetaClient metadata = new HoodieTableMetaClient(HoodieCLI.conf, HoodieCLI.tableMetadata.getBasePath());
HoodieCLI.setTableMetadata(metadata);
return "Metadata for table " + metadata.getTableConfig().getTableName() + " refreshed.";
}
@CliCommand(value = "commit rollback", help = "Rollback a commit")
public String rollbackCommit(
@CliOption(key = {"commit"}, help = "Commit to rollback")
final String commitTime,
@CliOption(key = {"sparkProperties"}, help = "Spark Properites File Path")
final String sparkPropertiesPath) throws Exception {
public String rollbackCommit(@CliOption(key = {"commit"}, help = "Commit to rollback") final String commitTime,
@CliOption(key = {"sparkProperties"}, help = "Spark Properites File Path") final String sparkPropertiesPath)
throws Exception {
HoodieActiveTimeline activeTimeline = HoodieCLI.tableMetadata.getActiveTimeline();
HoodieTimeline timeline = activeTimeline.getCommitsTimeline()
.filterCompletedInstants();
HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION,
commitTime);
HoodieTimeline timeline = activeTimeline.getCommitsTimeline().filterCompletedInstants();
HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime);
if (!timeline.containsInstant(commitInstant)) {
return "Commit " + commitTime + " not found in Commits " + timeline;
}
SparkLauncher sparkLauncher = SparkUtil.initLauncher(sparkPropertiesPath);
sparkLauncher.addAppArgs(SparkMain.SparkCommand.ROLLBACK.toString(),
commitTime,
HoodieCLI.tableMetadata.getBasePath());
sparkLauncher
.addAppArgs(SparkMain.SparkCommand.ROLLBACK.toString(), commitTime, HoodieCLI.tableMetadata.getBasePath());
Process process = sparkLauncher.launch();
InputStreamConsumer.captureOutput(process);
int exitCode = process.waitFor();
@@ -133,23 +123,18 @@ public class CommitsCommand implements CommandMarker {
}
@CliCommand(value = "commit showpartitions", help = "Show partition level details of a commit")
public String showCommitPartitions(
@CliOption(key = {"commit"}, help = "Commit to show")
final String commitTime) throws Exception {
public String showCommitPartitions(@CliOption(key = {"commit"}, help = "Commit to show") final String commitTime)
throws Exception {
HoodieActiveTimeline activeTimeline = HoodieCLI.tableMetadata.getActiveTimeline();
HoodieTimeline timeline = activeTimeline.getCommitsTimeline()
.filterCompletedInstants();
HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION,
commitTime);
HoodieTimeline timeline = activeTimeline.getCommitsTimeline().filterCompletedInstants();
HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime);
if (!timeline.containsInstant(commitInstant)) {
return "Commit " + commitTime + " not found in Commits " + timeline;
}
HoodieCommitMetadata meta =
HoodieCommitMetadata.fromBytes(activeTimeline.getInstantDetails(commitInstant).get());
HoodieCommitMetadata meta = HoodieCommitMetadata.fromBytes(activeTimeline.getInstantDetails(commitInstant).get());
List<String[]> rows = new ArrayList<String[]>();
for (Map.Entry<String, List<HoodieWriteStat>> entry : meta.getPartitionToWriteStats()
.entrySet()) {
for (Map.Entry<String, List<HoodieWriteStat>> entry : meta.getPartitionToWriteStats().entrySet()) {
String path = entry.getKey();
List<HoodieWriteStat> stats = entry.getValue();
long totalFilesAdded = 0;
@@ -169,50 +154,40 @@ public class CommitsCommand implements CommandMarker {
totalBytesWritten += stat.getTotalWriteBytes();
totalWriteErrors += stat.getTotalWriteErrors();
}
rows.add(new String[]{path, String.valueOf(totalFilesAdded),
String.valueOf(totalFilesUpdated), String.valueOf(totalRecordsInserted),
String.valueOf(totalRecordsUpdated),
NumericUtils.humanReadableByteCount(totalBytesWritten),
String.valueOf(totalWriteErrors)});
rows.add(new String[] {path, String.valueOf(totalFilesAdded), String.valueOf(totalFilesUpdated),
String.valueOf(totalRecordsInserted), String.valueOf(totalRecordsUpdated),
NumericUtils.humanReadableByteCount(totalBytesWritten), String.valueOf(totalWriteErrors)});
}
return HoodiePrintHelper.print(
new String[]{"Partition Path", "Total Files Added", "Total Files Updated",
"Total Records Inserted", "Total Records Updated", "Total Bytes Written",
"Total Errors"}, rows.toArray(new String[rows.size()][]));
new String[] {"Partition Path", "Total Files Added", "Total Files Updated", "Total Records Inserted",
"Total Records Updated", "Total Bytes Written", "Total Errors"}, rows.toArray(new String[rows.size()][]));
}
@CliCommand(value = "commit showfiles", help = "Show file level details of a commit")
public String showCommitFiles(
@CliOption(key = {"commit"}, help = "Commit to show")
final String commitTime) throws Exception {
public String showCommitFiles(@CliOption(key = {"commit"}, help = "Commit to show") final String commitTime)
throws Exception {
HoodieActiveTimeline activeTimeline = HoodieCLI.tableMetadata.getActiveTimeline();
HoodieTimeline timeline = activeTimeline.getCommitsTimeline()
.filterCompletedInstants();
HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION,
commitTime);
HoodieTimeline timeline = activeTimeline.getCommitsTimeline().filterCompletedInstants();
HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime);
if (!timeline.containsInstant(commitInstant)) {
return "Commit " + commitTime + " not found in Commits " + timeline;
}
HoodieCommitMetadata meta =
HoodieCommitMetadata.fromBytes(activeTimeline.getInstantDetails(commitInstant).get());
HoodieCommitMetadata meta = HoodieCommitMetadata.fromBytes(activeTimeline.getInstantDetails(commitInstant).get());
List<String[]> rows = new ArrayList<String[]>();
for (Map.Entry<String, List<HoodieWriteStat>> entry : meta.getPartitionToWriteStats()
.entrySet()) {
for (Map.Entry<String, List<HoodieWriteStat>> entry : meta.getPartitionToWriteStats().entrySet()) {
String path = entry.getKey();
List<HoodieWriteStat> stats = entry.getValue();
for (HoodieWriteStat stat : stats) {
rows.add(new String[]{path, stat.getFileId(), stat.getPrevCommit(),
String.valueOf(stat.getNumUpdateWrites()), String.valueOf(stat.getNumWrites()),
String.valueOf(stat.getTotalWriteBytes()),
rows.add(new String[] {path, stat.getFileId(), stat.getPrevCommit(), String.valueOf(stat.getNumUpdateWrites()),
String.valueOf(stat.getNumWrites()), String.valueOf(stat.getTotalWriteBytes()),
String.valueOf(stat.getTotalWriteErrors())});
}
}
return HoodiePrintHelper.print(
new String[]{"Partition Path", "File ID", "Previous Commit", "Total Records Updated",
"Total Records Written", "Total Bytes Written", "Total Errors"},
rows.toArray(new String[rows.size()][]));
new String[] {"Partition Path", "File ID", "Previous Commit", "Total Records Updated", "Total Records Written",
"Total Bytes Written", "Total Errors"}, rows.toArray(new String[rows.size()][]));
}
@CliAvailabilityIndicator({"commits compare"})
@@ -221,38 +196,30 @@ public class CommitsCommand implements CommandMarker {
}
@CliCommand(value = "commits compare", help = "Compare commits with another Hoodie dataset")
public String compareCommits(
@CliOption(key = {"path"}, help = "Path of the dataset to compare to")
final String path) throws Exception {
public String compareCommits(@CliOption(key = {"path"}, help = "Path of the dataset to compare to") final String path)
throws Exception {
HoodieTableMetaClient target = new HoodieTableMetaClient(HoodieCLI.conf, path);
HoodieTimeline targetTimeline = target.getActiveTimeline().getCommitsTimeline()
.filterCompletedInstants();
HoodieTimeline targetTimeline = target.getActiveTimeline().getCommitsTimeline().filterCompletedInstants();
HoodieTableMetaClient source = HoodieCLI.tableMetadata;
HoodieTimeline sourceTimeline = source.getActiveTimeline().getCommitsTimeline()
.filterCompletedInstants();
HoodieTimeline sourceTimeline = source.getActiveTimeline().getCommitsTimeline().filterCompletedInstants();
String targetLatestCommit =
targetTimeline.getInstants().iterator().hasNext() ? "0"
: targetTimeline.lastInstant().get().getTimestamp();
targetTimeline.getInstants().iterator().hasNext() ? "0" : targetTimeline.lastInstant().get().getTimestamp();
String sourceLatestCommit =
sourceTimeline.getInstants().iterator().hasNext() ? "0"
: sourceTimeline.lastInstant().get().getTimestamp();
sourceTimeline.getInstants().iterator().hasNext() ? "0" : sourceTimeline.lastInstant().get().getTimestamp();
if (sourceLatestCommit != null &&
HoodieTimeline
.compareTimestamps(targetLatestCommit, sourceLatestCommit, HoodieTimeline.GREATER)) {
if (sourceLatestCommit != null && HoodieTimeline.compareTimestamps(targetLatestCommit, sourceLatestCommit,
HoodieTimeline.GREATER)) {
// source is behind the target
List<String> commitsToCatchup =
targetTimeline.findInstantsAfter(sourceLatestCommit, Integer.MAX_VALUE)
List<String> commitsToCatchup = targetTimeline.findInstantsAfter(sourceLatestCommit, Integer.MAX_VALUE)
.getInstants().map(HoodieInstant::getTimestamp).collect(Collectors.toList());
return "Source " + source.getTableConfig().getTableName() + " is behind by "
+ commitsToCatchup.size() + " commits. Commits to catch up - " + commitsToCatchup;
return "Source " + source.getTableConfig().getTableName() + " is behind by " + commitsToCatchup.size()
+ " commits. Commits to catch up - " + commitsToCatchup;
} else {
List<String> commitsToCatchup =
sourceTimeline.findInstantsAfter(targetLatestCommit, Integer.MAX_VALUE)
List<String> commitsToCatchup = sourceTimeline.findInstantsAfter(targetLatestCommit, Integer.MAX_VALUE)
.getInstants().map(HoodieInstant::getTimestamp).collect(Collectors.toList());
return "Source " + source.getTableConfig().getTableName() + " is ahead by "
+ commitsToCatchup.size() + " commits. Commits to catch up - " + commitsToCatchup;
return "Source " + source.getTableConfig().getTableName() + " is ahead by " + commitsToCatchup.size()
+ " commits. Commits to catch up - " + commitsToCatchup;
}
}
@@ -262,13 +229,12 @@ public class CommitsCommand implements CommandMarker {
}
@CliCommand(value = "commits sync", help = "Compare commits with another Hoodie dataset")
public String syncCommits(
@CliOption(key = {"path"}, help = "Path of the dataset to compare to")
final String path) throws Exception {
public String syncCommits(@CliOption(key = {"path"}, help = "Path of the dataset to compare to") final String path)
throws Exception {
HoodieCLI.syncTableMetadata = new HoodieTableMetaClient(HoodieCLI.conf, path);
HoodieCLI.state = HoodieCLI.CLIState.SYNC;
return "Load sync state between " + HoodieCLI.tableMetadata.getTableConfig().getTableName()
+ " and " + HoodieCLI.syncTableMetadata.getTableConfig().getTableName();
return "Load sync state between " + HoodieCLI.tableMetadata.getTableConfig().getTableName() + " and "
+ HoodieCLI.syncTableMetadata.getTableConfig().getTableName();
}
}

View File

@@ -29,13 +29,12 @@ public class DatasetsCommand implements CommandMarker {
@CliCommand(value = "connect", help = "Connect to a hoodie dataset")
public String connect(
@CliOption(key = {"path"}, mandatory = true, help = "Base Path of the dataset")
final String path) throws IOException {
@CliOption(key = {"path"}, mandatory = true, help = "Base Path of the dataset") final String path)
throws IOException {
boolean initialized = HoodieCLI.initConf();
HoodieCLI.initFS(initialized);
HoodieCLI.setTableMetadata(new HoodieTableMetaClient(HoodieCLI.conf, path));
HoodieCLI.state = HoodieCLI.CLIState.DATASET;
return "Metadata for table " + HoodieCLI.tableMetadata.getTableConfig().getTableName()
+ " loaded";
return "Metadata for table " + HoodieCLI.tableMetadata.getTableConfig().getTableName() + " loaded";
}
}

View File

@@ -37,44 +37,33 @@ public class HDFSParquetImportCommand implements CommandMarker {
@CliCommand(value = "hdfsparquetimport", help = "Imports hdfs dataset to a hoodie dataset")
public String convert(
@CliOption(key = "srcPath", mandatory = true, help = "Base path for the input dataset")
final String srcPath,
@CliOption(key = "srcType", mandatory = true, help = "Source type for the input dataset")
final String srcType,
@CliOption(key = "targetPath", mandatory = true, help = "Base path for the target hoodie dataset")
final String targetPath,
@CliOption(key = "tableName", mandatory = true, help = "Table name")
final String tableName,
@CliOption(key = "tableType", mandatory = true, help = "Table type")
final String tableType,
@CliOption(key = "rowKeyField", mandatory = true, help = "Row key field name")
final String rowKeyField,
@CliOption(key = "partitionPathField", mandatory = true, help = "Partition path field name")
final String partitionPathField,
@CliOption(key = {"parallelism"}, mandatory = true, help = "Parallelism for hoodie insert")
final String parallelism,
@CliOption(key = "schemaFilePath", mandatory = true, help = "Path for Avro schema file")
final String schemaFilePath,
@CliOption(key = "format", mandatory = true, help = "Format for the input data")
final String format,
@CliOption(key = "sparkMemory", mandatory = true, help = "Spark executor memory")
final String sparkMemory,
@CliOption(key = "retry", mandatory = true, help = "Number of retries")
final String retry)
throws Exception {
@CliOption(key = "srcPath", mandatory = true, help = "Base path for the input dataset") final String srcPath,
@CliOption(key = "srcType", mandatory = true, help = "Source type for the input dataset") final String srcType,
@CliOption(key = "targetPath", mandatory = true, help = "Base path for the target hoodie dataset") final String
targetPath,
@CliOption(key = "tableName", mandatory = true, help = "Table name") final String tableName,
@CliOption(key = "tableType", mandatory = true, help = "Table type") final String tableType,
@CliOption(key = "rowKeyField", mandatory = true, help = "Row key field name") final String rowKeyField,
@CliOption(key = "partitionPathField", mandatory = true, help = "Partition path field name") final String
partitionPathField,
@CliOption(key = {
"parallelism"}, mandatory = true, help = "Parallelism for hoodie insert") final String parallelism,
@CliOption(key = "schemaFilePath", mandatory = true, help = "Path for Avro schema file") final String
schemaFilePath,
@CliOption(key = "format", mandatory = true, help = "Format for the input data") final String format,
@CliOption(key = "sparkMemory", mandatory = true, help = "Spark executor memory") final String sparkMemory,
@CliOption(key = "retry", mandatory = true, help = "Number of retries") final String retry) throws Exception {
validate(format, srcType);
boolean initialized = HoodieCLI.initConf();
HoodieCLI.initFS(initialized);
String sparkPropertiesPath = Utils
.getDefaultPropertiesFile(
String sparkPropertiesPath = Utils.getDefaultPropertiesFile(
scala.collection.JavaConversions.propertiesAsScalaMap(System.getProperties()));
SparkLauncher sparkLauncher = SparkUtil.initLauncher(sparkPropertiesPath);
sparkLauncher.addAppArgs(SparkCommand.IMPORT.toString(), srcPath, targetPath, tableName,
tableType, rowKeyField, partitionPathField, parallelism, schemaFilePath, sparkMemory,
retry);
sparkLauncher.addAppArgs(SparkCommand.IMPORT.toString(), srcPath, targetPath, tableName, tableType, rowKeyField,
partitionPathField, parallelism, schemaFilePath, sparkMemory, retry);
Process process = sparkLauncher.launch();
InputStreamConsumer.captureOutput(process);
int exitCode = process.waitFor();

View File

@@ -64,25 +64,25 @@ public class HoodieLogFileCommand implements CommandMarker {
@CliCommand(value = "show logfile metadata", help = "Read commit metadata from log files")
public String showLogFileCommits(
@CliOption(key = "logFilePathPattern", mandatory = true, help = "Fully qualified path for the log file")
final String logFilePathPattern) throws IOException {
@CliOption(key = "logFilePathPattern", mandatory = true, help = "Fully qualified path for the log file") final
String logFilePathPattern)
throws IOException {
FileSystem fs = HoodieCLI.tableMetadata.getFs();
List<String> logFilePaths = Arrays.stream(fs.globStatus(new Path(logFilePathPattern)))
.map(status -> status.getPath().toString()).collect(Collectors.toList());
Map<String, List<Tuple3<HoodieLogBlockType, Tuple2<Map<HeaderMetadataType, String>, Map<HeaderMetadataType, String>>, Integer>>> commitCountAndMetadata = Maps
.newHashMap();
Map<String, List<Tuple3<HoodieLogBlockType, Tuple2<Map<HeaderMetadataType, String>, Map<HeaderMetadataType,
String>>, Integer>>>
commitCountAndMetadata = Maps.newHashMap();
int totalEntries = 0;
int numCorruptBlocks = 0;
for (String logFilePath : logFilePaths) {
FileStatus[] fsStatus = fs.listStatus(
new Path(logFilePath));
Schema writerSchema = new AvroSchemaConverter()
.convert(SchemaUtil
.readSchemaFromLogFile(HoodieCLI.tableMetadata.getFs(), new Path(logFilePath)));
HoodieLogFormat.Reader reader = HoodieLogFormat.newReader(fs,
new HoodieLogFile(fsStatus[0].getPath()), writerSchema);
FileStatus[] fsStatus = fs.listStatus(new Path(logFilePath));
Schema writerSchema = new AvroSchemaConverter().convert(
SchemaUtil.readSchemaFromLogFile(HoodieCLI.tableMetadata.getFs(), new Path(logFilePath)));
HoodieLogFormat.Reader reader = HoodieLogFormat
.newReader(fs, new HoodieLogFile(fsStatus[0].getPath()), writerSchema);
// read the avro blocks
while (reader.hasNext()) {
@@ -104,15 +104,14 @@ public class HoodieLogFileCommand implements CommandMarker {
}
}
if (commitCountAndMetadata.containsKey(instantTime)) {
commitCountAndMetadata.get(instantTime)
.add(new Tuple3<>(n.getBlockType(),
new Tuple2<>(n.getLogBlockHeader(), n.getLogBlockFooter()), recordCount));
commitCountAndMetadata.get(instantTime).add(
new Tuple3<>(n.getBlockType(), new Tuple2<>(n.getLogBlockHeader(), n.getLogBlockFooter()), recordCount));
totalEntries++;
} else {
List<Tuple3<HoodieLogBlockType, Tuple2<Map<HeaderMetadataType, String>, Map<HeaderMetadataType, String>>, Integer>> list
= new ArrayList<>();
list.add(new Tuple3<>(n.getBlockType(),
new Tuple2<>(n.getLogBlockHeader(), n.getLogBlockFooter()), recordCount));
List<Tuple3<HoodieLogBlockType, Tuple2<Map<HeaderMetadataType, String>, Map<HeaderMetadataType, String>>,
Integer>> list = new ArrayList<>();
list.add(
new Tuple3<>(n.getBlockType(), new Tuple2<>(n.getLogBlockHeader(), n.getLogBlockFooter()), recordCount));
commitCountAndMetadata.put(instantTime, list);
totalEntries++;
}
@@ -121,11 +120,12 @@ public class HoodieLogFileCommand implements CommandMarker {
String[][] rows = new String[totalEntries + 1][];
int i = 0;
ObjectMapper objectMapper = new ObjectMapper();
for (Map.Entry<String, List<Tuple3<HoodieLogBlockType, Tuple2<Map<HeaderMetadataType, String>, Map<HeaderMetadataType, String>>, Integer>>> entry : commitCountAndMetadata
.entrySet()) {
for (Map.Entry<String, List<Tuple3<HoodieLogBlockType,
Tuple2<Map<HeaderMetadataType, String>, Map<HeaderMetadataType, String>>, Integer>>> entry
: commitCountAndMetadata.entrySet()) {
String instantTime = entry.getKey().toString();
for (Tuple3<HoodieLogBlockType, Tuple2<Map<HeaderMetadataType, String>, Map<HeaderMetadataType, String>>, Integer> tuple3 : entry
.getValue()) {
for (Tuple3<HoodieLogBlockType, Tuple2<Map<HeaderMetadataType, String>,
Map<HeaderMetadataType, String>>, Integer> tuple3 : entry.getValue()) {
String[] output = new String[5];
output[0] = instantTime;
output[1] = String.valueOf(tuple3._3());
@@ -136,24 +136,21 @@ public class HoodieLogFileCommand implements CommandMarker {
i++;
}
}
return HoodiePrintHelper.print(
new String[]{"InstantTime", "RecordCount", "BlockType", "HeaderMetadata", "FooterMetadata"},
return HoodiePrintHelper
.print(new String[] {"InstantTime", "RecordCount", "BlockType", "HeaderMetadata", "FooterMetadata"},
rows);
}
@CliCommand(value = "show logfile records", help = "Read records from log files")
public String showLogFileRecords(
@CliOption(key = {
"limit"}, mandatory = false, help = "Limit commits", unspecifiedDefaultValue = "10")
final Integer limit,
public String showLogFileRecords(@CliOption(key = {
"limit"}, mandatory = false, help = "Limit commits", unspecifiedDefaultValue = "10") final Integer limit,
@CliOption(key = "logFilePathPattern", mandatory = true, help = "Fully qualified paths for the log files")
final String logFilePathPattern,
@CliOption(key = "mergeRecords", mandatory = false, help = "If the records in the log files should be merged",
unspecifiedDefaultValue = "false")
final Boolean shouldMerge) throws IOException {
unspecifiedDefaultValue = "false") final Boolean shouldMerge)
throws IOException {
System.out
.println("===============> Showing only " + limit + " records <===============");
System.out.println("===============> Showing only " + limit + " records <===============");
FileSystem fs = HoodieCLI.tableMetadata.getFs();
List<String> logFilePaths = Arrays.stream(fs.globStatus(new Path(logFilePathPattern)))
@@ -162,9 +159,8 @@ public class HoodieLogFileCommand implements CommandMarker {
// TODO : readerSchema can change across blocks/log files, fix this inside Scanner
AvroSchemaConverter converter = new AvroSchemaConverter();
// get schema from last log file
Schema readerSchema = converter
.convert(SchemaUtil
.readSchemaFromLogFile(fs, new Path(logFilePaths.get(logFilePaths.size() - 1))));
Schema readerSchema = converter.convert(
SchemaUtil.readSchemaFromLogFile(fs, new Path(logFilePaths.get(logFilePaths.size() - 1))));
List<IndexedRecord> allRecords = new ArrayList<>();
@@ -186,11 +182,10 @@ public class HoodieLogFileCommand implements CommandMarker {
}
} else {
for (String logFile : logFilePaths) {
Schema writerSchema = new AvroSchemaConverter()
.convert(SchemaUtil
.readSchemaFromLogFile(HoodieCLI.tableMetadata.getFs(), new Path(logFile)));
HoodieLogFormat.Reader reader = HoodieLogFormat.newReader(fs,
new HoodieLogFile(new Path(logFile)), writerSchema);
Schema writerSchema = new AvroSchemaConverter().convert(
SchemaUtil.readSchemaFromLogFile(HoodieCLI.tableMetadata.getFs(), new Path(logFile)));
HoodieLogFormat.Reader reader = HoodieLogFormat
.newReader(fs, new HoodieLogFile(new Path(logFile)), writerSchema);
// read the avro blocks
while (reader.hasNext()) {
HoodieLogBlock n = reader.next();
@@ -216,7 +211,6 @@ public class HoodieLogFileCommand implements CommandMarker {
rows[i] = data;
i++;
}
return HoodiePrintHelper.print(
new String[]{"Records"}, rows);
return HoodiePrintHelper.print(new String[] {"Records"}, rows);
}
}

View File

@@ -40,26 +40,22 @@ public class HoodieSyncCommand implements CommandMarker {
@CliCommand(value = "sync validate", help = "Validate the sync by counting the number of records")
public String validateSync(
@CliOption(key = {"mode"}, unspecifiedDefaultValue = "complete", help = "Check mode")
final String mode,
@CliOption(key = {"mode"}, unspecifiedDefaultValue = "complete", help = "Check mode") final String mode,
@CliOption(key = {"sourceDb"}, unspecifiedDefaultValue = "rawdata", help = "source database") final String srcDb,
@CliOption(key = {
"sourceDb"}, unspecifiedDefaultValue = "rawdata", help = "source database")
final String srcDb,
@CliOption(key = {
"targetDb"}, unspecifiedDefaultValue = "dwh_hoodie", help = "target database")
final String tgtDb,
"targetDb"}, unspecifiedDefaultValue = "dwh_hoodie", help = "target database") final String tgtDb,
@CliOption(key = {
"partitionCount"}, unspecifiedDefaultValue = "5", help = "total number of recent partitions to validate")
final int partitionCount,
@CliOption(key = {
"hiveServerUrl"}, mandatory = true, help = "hiveServerURL to connect to")
final String hiveServerUrl,
"hiveServerUrl"}, mandatory = true, help = "hiveServerURL to connect to") final String hiveServerUrl,
@CliOption(key = {
"hiveUser"}, mandatory = false, unspecifiedDefaultValue = "", help = "hive username to connect to")
final String hiveUser,
"hiveUser"}, mandatory = false, unspecifiedDefaultValue = "", help = "hive username to connect to") final
String hiveUser,
@CliOption(key = {
"hivePass"}, mandatory = true, unspecifiedDefaultValue = "", help = "hive password to connect to")
final String hivePass) throws Exception {
"hivePass"}, mandatory = true, unspecifiedDefaultValue = "", help = "hive password to connect to") final
String hivePass)
throws Exception {
HoodieTableMetaClient target = HoodieCLI.syncTableMetadata;
HoodieTimeline targetTimeline = target.getActiveTimeline().getCommitsTimeline();
HoodieTableMetaClient source = HoodieCLI.tableMetadata;
@@ -70,52 +66,42 @@ public class HoodieSyncCommand implements CommandMarker {
sourceCount = HiveUtil.countRecords(hiveServerUrl, source, srcDb, hiveUser, hivePass);
targetCount = HiveUtil.countRecords(hiveServerUrl, target, tgtDb, hiveUser, hivePass);
} else if ("latestPartitions".equals(mode)) {
sourceCount = HiveUtil
.countRecords(hiveServerUrl, source, srcDb, partitionCount, hiveUser, hivePass);
targetCount = HiveUtil
.countRecords(hiveServerUrl, target, tgtDb, partitionCount, hiveUser, hivePass);
sourceCount = HiveUtil.countRecords(hiveServerUrl, source, srcDb, partitionCount, hiveUser, hivePass);
targetCount = HiveUtil.countRecords(hiveServerUrl, target, tgtDb, partitionCount, hiveUser, hivePass);
}
String targetLatestCommit =
targetTimeline.getInstants().iterator().hasNext() ? "0"
: targetTimeline.lastInstant().get().getTimestamp();
targetTimeline.getInstants().iterator().hasNext() ? "0" : targetTimeline.lastInstant().get().getTimestamp();
String sourceLatestCommit =
sourceTimeline.getInstants().iterator().hasNext() ? "0"
: sourceTimeline.lastInstant().get().getTimestamp();
sourceTimeline.getInstants().iterator().hasNext() ? "0" : sourceTimeline.lastInstant().get().getTimestamp();
if (sourceLatestCommit != null && HoodieTimeline
.compareTimestamps(targetLatestCommit, sourceLatestCommit, HoodieTimeline.GREATER)) {
if (sourceLatestCommit != null && HoodieTimeline.compareTimestamps(targetLatestCommit, sourceLatestCommit,
HoodieTimeline.GREATER)) {
// source is behind the target
List<HoodieInstant> commitsToCatchup =
targetTimeline.findInstantsAfter(sourceLatestCommit, Integer.MAX_VALUE).getInstants()
.collect(Collectors.toList());
List<HoodieInstant> commitsToCatchup = targetTimeline.findInstantsAfter(sourceLatestCommit, Integer.MAX_VALUE)
.getInstants().collect(Collectors.toList());
if (commitsToCatchup.isEmpty()) {
return "Count difference now is (count(" + target.getTableConfig().getTableName()
+ ") - count(" + source.getTableConfig().getTableName() + ") == " + (targetCount
- sourceCount);
return "Count difference now is (count(" + target.getTableConfig().getTableName() + ") - count("
+ source.getTableConfig().getTableName() + ") == " + (targetCount - sourceCount);
} else {
long newInserts = CommitUtil.countNewRecords(target,
commitsToCatchup.stream().map(HoodieInstant::getTimestamp)
.collect(Collectors.toList()));
return "Count difference now is (count(" + target.getTableConfig().getTableName()
+ ") - count(" + source.getTableConfig().getTableName() + ") == " + (targetCount
- sourceCount) + ". Catch up count is " + newInserts;
commitsToCatchup.stream().map(HoodieInstant::getTimestamp).collect(Collectors.toList()));
return "Count difference now is (count(" + target.getTableConfig().getTableName() + ") - count("
+ source.getTableConfig().getTableName()
+ ") == " + (targetCount - sourceCount) + ". Catch up count is " + newInserts;
}
} else {
List<HoodieInstant> commitsToCatchup =
sourceTimeline.findInstantsAfter(targetLatestCommit, Integer.MAX_VALUE).getInstants()
.collect(Collectors.toList());
List<HoodieInstant> commitsToCatchup = sourceTimeline.findInstantsAfter(targetLatestCommit, Integer.MAX_VALUE)
.getInstants().collect(Collectors.toList());
if (commitsToCatchup.isEmpty()) {
return "Count difference now is (count(" + source.getTableConfig().getTableName()
+ ") - count(" + target.getTableConfig().getTableName() + ") == " + (sourceCount
- targetCount);
return "Count difference now is (count(" + source.getTableConfig().getTableName() + ") - count("
+ target.getTableConfig().getTableName() + ") == " + (sourceCount - targetCount);
} else {
long newInserts = CommitUtil.countNewRecords(source,
commitsToCatchup.stream().map(HoodieInstant::getTimestamp)
.collect(Collectors.toList()));
return "Count difference now is (count(" + source.getTableConfig().getTableName()
+ ") - count(" + target.getTableConfig().getTableName() + ") == " + (sourceCount
- targetCount) + ". Catch up count is " + newInserts;
commitsToCatchup.stream().map(HoodieInstant::getTimestamp).collect(Collectors.toList()));
return "Count difference now is (count(" + source.getTableConfig().getTableName() + ") - count("
+ target.getTableConfig().getTableName()
+ ") == " + (sourceCount - targetCount) + ". Catch up count is " + newInserts;
}
}

View File

@@ -45,20 +45,20 @@ public class RepairsCommand implements CommandMarker {
return HoodieCLI.tableMetadata != null;
}
@CliCommand(value = "repair deduplicate", help = "De-duplicate a partition path contains duplicates & produce repaired files to replace with")
public String deduplicate(
@CliCommand(value = "repair deduplicate", help = "De-duplicate a partition path contains duplicates & produce "
+ "repaired files to replace with")
public String deduplicate(@CliOption(key = {
"duplicatedPartitionPath"}, help = "Partition Path containing the duplicates", mandatory = true) final String
duplicatedPartitionPath,
@CliOption(key = {
"duplicatedPartitionPath"}, help = "Partition Path containing the duplicates", mandatory = true)
final String duplicatedPartitionPath,
"repairedOutputPath"}, help = "Location to place the repaired files", mandatory = true) final String
repairedOutputPath,
@CliOption(key = {
"repairedOutputPath"}, help = "Location to place the repaired files", mandatory = true)
final String repairedOutputPath,
@CliOption(key = {"sparkProperties"}, help = "Spark Properites File Path", mandatory = true)
final String sparkPropertiesPath) throws Exception {
"sparkProperties"}, help = "Spark Properites File Path", mandatory = true) final String sparkPropertiesPath)
throws Exception {
SparkLauncher sparkLauncher = SparkUtil.initLauncher(sparkPropertiesPath);
sparkLauncher
.addAppArgs(SparkMain.SparkCommand.DEDUPLICATE.toString(), duplicatedPartitionPath,
repairedOutputPath, HoodieCLI.tableMetadata.getBasePath());
sparkLauncher.addAppArgs(SparkMain.SparkCommand.DEDUPLICATE.toString(), duplicatedPartitionPath, repairedOutputPath,
HoodieCLI.tableMetadata.getBasePath());
Process process = sparkLauncher.launch();
InputStreamConsumer.captureOutput(process);
int exitCode = process.waitFor();
@@ -71,14 +71,12 @@ public class RepairsCommand implements CommandMarker {
@CliCommand(value = "repair addpartitionmeta", help = "Add partition metadata to a dataset, if not present")
public String addPartitionMeta(
@CliOption(key = {"dryrun"},
help = "Should we actually add or just print what would be done",
unspecifiedDefaultValue = "true")
public String addPartitionMeta(@CliOption(key = {
"dryrun"}, help = "Should we actually add or just print what would be done", unspecifiedDefaultValue = "true")
final boolean dryRun) throws IOException {
String latestCommit = HoodieCLI.tableMetadata.getActiveTimeline().getCommitTimeline()
.lastInstant().get().getTimestamp();
String latestCommit = HoodieCLI.tableMetadata.getActiveTimeline().getCommitTimeline().lastInstant().get()
.getTimestamp();
List<String> partitionPaths = FSUtils.getAllFoldersThreeLevelsDown(HoodieCLI.fs,
HoodieCLI.tableMetadata.getBasePath());
Path basePath = new Path(HoodieCLI.tableMetadata.getBasePath());
@@ -94,10 +92,7 @@ public class RepairsCommand implements CommandMarker {
if (!HoodiePartitionMetadata.hasPartitionMetadata(HoodieCLI.fs, partitionPath)) {
row[1] = "No";
if (!dryRun) {
HoodiePartitionMetadata partitionMetadata = new HoodiePartitionMetadata(
HoodieCLI.fs,
latestCommit,
basePath,
HoodiePartitionMetadata partitionMetadata = new HoodiePartitionMetadata(HoodieCLI.fs, latestCommit, basePath,
partitionPath);
partitionMetadata.trySave(0);
}
@@ -105,7 +100,6 @@ public class RepairsCommand implements CommandMarker {
rows[ind++] = row;
}
return HoodiePrintHelper.print(
new String[]{"Partition Path", "Metadata Present?", "Action"}, rows);
return HoodiePrintHelper.print(new String[] {"Partition Path", "Metadata Present?", "Action"}, rows);
}
}

View File

@@ -13,6 +13,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.uber.hoodie.cli.commands;
import com.uber.hoodie.HoodieWriteClient;
@@ -60,8 +61,8 @@ public class SavepointsCommand implements CommandMarker {
@CliAvailabilityIndicator({"savepoint rollback"})
public boolean isRollbackToSavepointAvailable() {
return HoodieCLI.tableMetadata != null && !HoodieCLI.tableMetadata.getActiveTimeline()
.getSavePointTimeline().filterCompletedInstants().empty();
return HoodieCLI.tableMetadata != null && !HoodieCLI.tableMetadata.getActiveTimeline().getSavePointTimeline()
.filterCompletedInstants().empty();
}
@CliCommand(value = "savepoints show", help = "Show the savepoints")
@@ -79,17 +80,13 @@ public class SavepointsCommand implements CommandMarker {
}
@CliCommand(value = "savepoint create", help = "Savepoint a commit")
public String savepoint(
@CliOption(key = {"commit"}, help = "Commit to savepoint")
final String commitTime,
@CliOption(key = {"user"}, help = "User who is creating the savepoint")
final String user,
@CliOption(key = {"comments"}, help = "Comments for creating the savepoint")
final String comments) throws Exception {
public String savepoint(@CliOption(key = {"commit"}, help = "Commit to savepoint") final String commitTime,
@CliOption(key = {"user"}, help = "User who is creating the savepoint") final String user,
@CliOption(key = {"comments"}, help = "Comments for creating the savepoint") final String comments)
throws Exception {
HoodieActiveTimeline activeTimeline = HoodieCLI.tableMetadata.getActiveTimeline();
HoodieTimeline timeline = activeTimeline.getCommitTimeline().filterCompletedInstants();
HoodieInstant
commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime);
HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime);
if (!timeline.containsInstant(commitInstant)) {
return "Commit " + commitTime + " not found in Commits " + timeline;
@@ -106,22 +103,19 @@ public class SavepointsCommand implements CommandMarker {
@CliCommand(value = "savepoint rollback", help = "Savepoint a commit")
public String rollbackToSavepoint(
@CliOption(key = {"savepoint"}, help = "Savepoint to rollback")
final String commitTime,
@CliOption(key = {"sparkProperties"}, help = "Spark Properites File Path")
final String sparkPropertiesPath) throws Exception {
@CliOption(key = {"savepoint"}, help = "Savepoint to rollback") final String commitTime,
@CliOption(key = {"sparkProperties"}, help = "Spark Properites File Path") final String sparkPropertiesPath)
throws Exception {
HoodieActiveTimeline activeTimeline = HoodieCLI.tableMetadata.getActiveTimeline();
HoodieTimeline timeline = activeTimeline.getCommitTimeline().filterCompletedInstants();
HoodieInstant
commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime);
HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime);
if (!timeline.containsInstant(commitInstant)) {
return "Commit " + commitTime + " not found in Commits " + timeline;
}
SparkLauncher sparkLauncher = SparkUtil.initLauncher(sparkPropertiesPath);
sparkLauncher.addAppArgs(SparkMain.SparkCommand.ROLLBACK_TO_SAVEPOINT.toString(),
commitTime,
sparkLauncher.addAppArgs(SparkMain.SparkCommand.ROLLBACK_TO_SAVEPOINT.toString(), commitTime,
HoodieCLI.tableMetadata.getBasePath());
Process process = sparkLauncher.launch();
InputStreamConsumer.captureOutput(process);
@@ -137,18 +131,14 @@ public class SavepointsCommand implements CommandMarker {
@CliCommand(value = "savepoints refresh", help = "Refresh the savepoints")
public String refreshMetaClient() throws IOException {
HoodieTableMetaClient metadata =
new HoodieTableMetaClient(HoodieCLI.conf, HoodieCLI.tableMetadata.getBasePath());
HoodieTableMetaClient metadata = new HoodieTableMetaClient(HoodieCLI.conf, HoodieCLI.tableMetadata.getBasePath());
HoodieCLI.setTableMetadata(metadata);
return "Metadata for table " + metadata.getTableConfig().getTableName() + " refreshed.";
}
private static HoodieWriteClient createHoodieClient(JavaSparkContext jsc, String basePath)
throws Exception {
HoodieWriteConfig config = HoodieWriteConfig.newBuilder().withPath(basePath)
.withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build())
.build();
private static HoodieWriteClient createHoodieClient(JavaSparkContext jsc, String basePath) throws Exception {
HoodieWriteConfig config = HoodieWriteConfig.newBuilder().withPath(basePath).withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build()).build();
return new HoodieWriteClient(jsc, config, false);
}

View File

@@ -30,18 +30,14 @@ import org.apache.spark.sql.SQLContext;
public class SparkMain {
protected final static Logger LOG = Logger.getLogger(SparkMain.class);
protected static final Logger LOG = Logger.getLogger(SparkMain.class);
/**
* Commands
*/
enum SparkCommand {
ROLLBACK,
DEDUPLICATE,
ROLLBACK_TO_SAVEPOINT,
SAVEPOINT,
IMPORT
ROLLBACK, DEDUPLICATE, ROLLBACK_TO_SAVEPOINT, SAVEPOINT, IMPORT
}
public static void main(String[] args) throws Exception {
@@ -67,18 +63,19 @@ public class SparkMain {
break;
case IMPORT:
assert (args.length == 11);
returnCode = dataImport(jsc, args[1], args[2], args[3], args[4], args[5], args[6],
Integer.parseInt(args[7]), args[8], SparkUtil.DEFUALT_SPARK_MASTER, args[9],
Integer.parseInt(args[10]));
returnCode = dataImport(jsc, args[1], args[2], args[3], args[4], args[5], args[6], Integer.parseInt(args[7]),
args[8], SparkUtil.DEFUALT_SPARK_MASTER, args[9], Integer.parseInt(args[10]));
break;
default:
break;
}
System.exit(returnCode);
}
private static int dataImport(JavaSparkContext jsc, String srcPath, String targetPath,
String tableName, String tableType, String rowKey, String partitionKey, int parallelism,
String schemaFile, String sparkMaster, String sparkMemory, int retry) throws Exception {
private static int dataImport(JavaSparkContext jsc, String srcPath, String targetPath, String tableName,
String tableType, String rowKey, String partitionKey, int parallelism, String schemaFile, String sparkMaster,
String sparkMemory, int retry) throws Exception {
HDFSParquetImporter.Config cfg = new HDFSParquetImporter.Config();
cfg.srcPath = srcPath;
cfg.targetPath = targetPath;
@@ -92,19 +89,15 @@ public class SparkMain {
return new HDFSParquetImporter(cfg).dataImport(jsc, retry);
}
private static int deduplicatePartitionPath(JavaSparkContext jsc,
String duplicatedPartitionPath,
String repairedOutputPath,
String basePath)
throws Exception {
DedupeSparkJob job = new DedupeSparkJob(basePath, duplicatedPartitionPath, repairedOutputPath,
new SQLContext(jsc), FSUtils.getFs(basePath, jsc.hadoopConfiguration()));
private static int deduplicatePartitionPath(JavaSparkContext jsc, String duplicatedPartitionPath,
String repairedOutputPath, String basePath) throws Exception {
DedupeSparkJob job = new DedupeSparkJob(basePath, duplicatedPartitionPath, repairedOutputPath, new SQLContext(jsc),
FSUtils.getFs(basePath, jsc.hadoopConfiguration()));
job.fixDuplicates(true);
return 0;
}
private static int rollback(JavaSparkContext jsc, String commitTime, String basePath)
throws Exception {
private static int rollback(JavaSparkContext jsc, String commitTime, String basePath) throws Exception {
HoodieWriteClient client = createHoodieClient(jsc, basePath);
if (client.rollback(commitTime)) {
LOG.info(String.format("The commit \"%s\" rolled back.", commitTime));
@@ -115,9 +108,7 @@ public class SparkMain {
}
}
private static int rollbackToSavepoint(JavaSparkContext jsc, String savepointTime,
String basePath)
throws Exception {
private static int rollbackToSavepoint(JavaSparkContext jsc, String savepointTime, String basePath) throws Exception {
HoodieWriteClient client = createHoodieClient(jsc, basePath);
if (client.rollbackToSavepoint(savepointTime)) {
LOG.info(String.format("The commit \"%s\" rolled back.", savepointTime));
@@ -128,12 +119,9 @@ public class SparkMain {
}
}
private static HoodieWriteClient createHoodieClient(JavaSparkContext jsc, String basePath)
throws Exception {
HoodieWriteConfig config = HoodieWriteConfig.newBuilder().withPath(basePath)
.withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build())
.build();
private static HoodieWriteClient createHoodieClient(JavaSparkContext jsc, String basePath) throws Exception {
HoodieWriteConfig config = HoodieWriteConfig.newBuilder().withPath(basePath).withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build()).build();
return new HoodieWriteClient(jsc, config);
}
}

View File

@@ -16,7 +16,6 @@
package com.uber.hoodie.cli.commands;
import com.codahale.metrics.Histogram;
import com.codahale.metrics.Snapshot;
import com.codahale.metrics.UniformReservoir;
@@ -44,12 +43,15 @@ import org.springframework.stereotype.Component;
@Component
public class StatsCommand implements CommandMarker {
private static final int MAX_FILES = 1000000;
@CliAvailabilityIndicator({"stats wa"})
public boolean isWriteAmpAvailable() {
return HoodieCLI.tableMetadata != null;
}
@CliCommand(value = "stats wa", help = "Write Amplification. Ratio of how many records were upserted to how many records were actually written")
@CliCommand(value = "stats wa", help = "Write Amplification. Ratio of how many records were upserted to how many "
+ "records were actually written")
public String writeAmplificationStats() throws IOException {
long totalRecordsUpserted = 0;
long totalRecordsWritten = 0;
@@ -60,18 +62,13 @@ public class StatsCommand implements CommandMarker {
String[][] rows = new String[new Long(timeline.countInstants()).intValue() + 1][];
int i = 0;
DecimalFormat df = new DecimalFormat("#.00");
for (HoodieInstant commitTime : timeline.getInstants().collect(
Collectors.toList())) {
for (HoodieInstant commitTime : timeline.getInstants().collect(Collectors.toList())) {
String waf = "0";
HoodieCommitMetadata commit = HoodieCommitMetadata
.fromBytes(activeTimeline.getInstantDetails(commitTime).get());
HoodieCommitMetadata commit = HoodieCommitMetadata.fromBytes(activeTimeline.getInstantDetails(commitTime).get());
if (commit.fetchTotalUpdateRecordsWritten() > 0) {
waf = df.format(
(float) commit.fetchTotalRecordsWritten() / commit
.fetchTotalUpdateRecordsWritten());
waf = df.format((float) commit.fetchTotalRecordsWritten() / commit.fetchTotalUpdateRecordsWritten());
}
rows[i++] = new String[]{commitTime.getTimestamp(),
String.valueOf(commit.fetchTotalUpdateRecordsWritten()),
rows[i++] = new String[] {commitTime.getTimestamp(), String.valueOf(commit.fetchTotalUpdateRecordsWritten()),
String.valueOf(commit.fetchTotalRecordsWritten()), waf};
totalRecordsUpserted += commit.fetchTotalUpdateRecordsWritten();
totalRecordsWritten += commit.fetchTotalRecordsWritten();
@@ -80,43 +77,32 @@ public class StatsCommand implements CommandMarker {
if (totalRecordsUpserted > 0) {
waf = df.format((float) totalRecordsWritten / totalRecordsUpserted);
}
rows[i] = new String[]{"Total", String.valueOf(totalRecordsUpserted),
String.valueOf(totalRecordsWritten), waf};
return HoodiePrintHelper.print(
new String[]{"CommitTime", "Total Upserted", "Total Written",
"Write Amplifiation Factor"}, rows);
rows[i] = new String[] {"Total", String.valueOf(totalRecordsUpserted), String.valueOf(totalRecordsWritten), waf};
return HoodiePrintHelper
.print(new String[] {"CommitTime", "Total Upserted", "Total Written", "Write Amplifiation Factor"},
rows);
}
private String[] printFileSizeHistogram(String commitTime, Snapshot s) {
return new String[]{
commitTime,
NumericUtils.humanReadableByteCount(s.getMin()),
NumericUtils.humanReadableByteCount(s.getValue(0.1)),
NumericUtils.humanReadableByteCount(s.getMedian()),
NumericUtils.humanReadableByteCount(s.getMean()),
NumericUtils.humanReadableByteCount(s.get95thPercentile()),
NumericUtils.humanReadableByteCount(s.getMax()),
String.valueOf(s.size()),
NumericUtils.humanReadableByteCount(s.getStdDev())
};
return new String[] {commitTime, NumericUtils.humanReadableByteCount(s.getMin()),
NumericUtils.humanReadableByteCount(s.getValue(0.1)), NumericUtils.humanReadableByteCount(s.getMedian()),
NumericUtils.humanReadableByteCount(s.getMean()), NumericUtils.humanReadableByteCount(s.get95thPercentile()),
NumericUtils.humanReadableByteCount(s.getMax()), String.valueOf(s.size()),
NumericUtils.humanReadableByteCount(s.getStdDev())};
}
@CliCommand(value = "stats filesizes", help = "File Sizes. Display summary stats on sizes of files")
public String fileSizeStats(
@CliOption(key = {
"partitionPath"}, help = "regex to select files, eg: 2016/08/02", unspecifiedDefaultValue = "*/*/*")
final String globRegex) throws IOException {
public String fileSizeStats(@CliOption(key = {
"partitionPath"}, help = "regex to select files, eg: 2016/08/02", unspecifiedDefaultValue = "*/*/*") final
String globRegex) throws IOException {
FileSystem fs = HoodieCLI.fs;
String globPath = String.format("%s/%s/*",
HoodieCLI.tableMetadata.getBasePath(),
globRegex);
String globPath = String.format("%s/%s/*", HoodieCLI.tableMetadata.getBasePath(), globRegex);
FileStatus[] statuses = fs.globStatus(new Path(globPath));
// max, min, #small files < 10MB, 50th, avg, 95th
final int MAX_FILES = 1000000;
Histogram globalHistogram = new Histogram(new UniformReservoir(MAX_FILES));
HashMap<String, Histogram> commitHistoMap = new HashMap<String, Histogram>();
for (FileStatus fileStatus : statuses) {
@@ -138,8 +124,8 @@ public class StatsCommand implements CommandMarker {
Snapshot s = globalHistogram.getSnapshot();
rows[ind++] = printFileSizeHistogram("ALL", s);
return HoodiePrintHelper.print(
new String[]{"CommitTime", "Min", "10th", "50th", "avg", "95th", "Max", "NumFiles",
"StdDev"}, rows);
return HoodiePrintHelper
.print(new String[] {"CommitTime", "Min", "10th", "50th", "avg", "95th", "Max", "NumFiles", "StdDev"},
rows);
}
}
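As an aside, the write-amplification figure printed by the stats command above is simply total records written divided by total records updated, per commit and in total. A minimal standalone sketch of that arithmetic (the counts are illustrative, not taken from this change):

import java.text.DecimalFormat;

public class WriteAmplificationExample {

  public static void main(String[] args) {
    long totalRecordsWritten = 1_200_000L;        // illustrative commit totals
    long totalUpdateRecordsWritten = 300_000L;
    DecimalFormat df = new DecimalFormat("#.00");
    String waf = "0";
    if (totalUpdateRecordsWritten > 0) {
      // Same ratio the stats command prints: records written / records updated
      waf = df.format((float) totalRecordsWritten / totalUpdateRecordsWritten);
    }
    System.out.println("Write Amplification Factor: " + waf);   // 4.00 (decimal separator is locale dependent)
  }
}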

View File

@@ -25,9 +25,7 @@ import org.springframework.stereotype.Component;
public class UtilsCommand implements CommandMarker {
@CliCommand(value = "utils loadClass", help = "Load a class")
public String loadClass(
@CliOption(key = {"class"}, help = "Check mode") final String clazz
) throws Exception {
public String loadClass(@CliOption(key = {"class"}, help = "Check mode") final String clazz) throws Exception {
Class klass = Class.forName(clazz);
return klass.getProtectionDomain().getCodeSource().getLocation().toExternalForm();
}

View File

@@ -25,15 +25,12 @@ import java.util.List;
public class CommitUtil {
public static long countNewRecords(HoodieTableMetaClient target, List<String> commitsToCatchup)
throws IOException {
public static long countNewRecords(HoodieTableMetaClient target, List<String> commitsToCatchup) throws IOException {
long totalNew = 0;
HoodieTimeline timeline = target.getActiveTimeline().reload().getCommitTimeline()
.filterCompletedInstants();
HoodieTimeline timeline = target.getActiveTimeline().reload().getCommitTimeline().filterCompletedInstants();
for (String commit : commitsToCatchup) {
HoodieCommitMetadata c = HoodieCommitMetadata.fromBytes(timeline
.getInstantDetails(new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commit))
.get());
HoodieCommitMetadata c = HoodieCommitMetadata.fromBytes(
timeline.getInstantDetails(new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commit)).get());
totalNew += c.fetchTotalRecordsWritten() - c.fetchTotalUpdateRecordsWritten();
}
return totalNew;
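The count above treats the "new" records of a commit as records written minus records updated. A tiny standalone sketch of that sum over a catch-up window (the per-commit numbers are illustrative):

import java.util.Arrays;
import java.util.List;

public class CountNewRecordsExample {

  public static void main(String[] args) {
    // Each entry stands in for one commit's metadata: {recordsWritten, updateRecordsWritten}
    List<long[]> commitsToCatchup = Arrays.asList(new long[] {1000, 200}, new long[] {500, 500});
    long totalNew = 0;
    for (long[] commit : commitsToCatchup) {
      totalNew += commit[0] - commit[1];   // new records = written - updated, as in countNewRecords above
    }
    System.out.println("Total new records: " + totalNew);   // 800
  }
}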

View File

@@ -27,7 +27,7 @@ import org.joda.time.DateTime;
public class HiveUtil {
private static String driverName = "org.apache.hive.jdbc.HiveDriver";
private static final String driverName = "org.apache.hive.jdbc.HiveDriver";
static {
try {
@@ -39,8 +39,7 @@ public class HiveUtil {
private static Connection connection;
private static Connection getConnection(String jdbcUrl, String user, String pass)
throws SQLException {
private static Connection getConnection(String jdbcUrl, String user, String pass) throws SQLException {
DataSource ds = getDatasource(jdbcUrl, user, pass);
return ds.getConnection();
}
@@ -54,8 +53,8 @@ public class HiveUtil {
return ds;
}
public static long countRecords(String jdbcUrl, HoodieTableMetaClient source, String dbName,
String user, String pass) throws SQLException {
public static long countRecords(String jdbcUrl, HoodieTableMetaClient source, String dbName, String user, String pass)
throws SQLException {
Connection conn = HiveUtil.getConnection(jdbcUrl, user, pass);
ResultSet rs = null;
Statement stmt = conn.createStatement();
@@ -64,15 +63,13 @@ public class HiveUtil {
stmt.execute("set hive.input.format=org.apache.hadoop.hive.ql.io.HiveInputFormat");
stmt.execute("set hive.stats.autogather=false");
rs = stmt.executeQuery(
"select count(`_hoodie_commit_time`) as cnt from " + dbName + "." + source
.getTableConfig()
.getTableName());
"select count(`_hoodie_commit_time`) as cnt from " + dbName + "."
+ source.getTableConfig().getTableName());
long count = -1;
if (rs.next()) {
count = rs.getLong("cnt");
}
System.out
.println("Total records in " + source.getTableConfig().getTableName() + " is " + count);
System.out.println("Total records in " + source.getTableConfig().getTableName() + " is " + count);
return count;
} finally {
if (rs != null) {
@@ -84,22 +81,19 @@ public class HiveUtil {
}
}
public static long countRecords(String jdbcUrl, HoodieTableMetaClient source, String srcDb,
int partitions, String user, String pass) throws SQLException {
public static long countRecords(String jdbcUrl, HoodieTableMetaClient source, String srcDb, int partitions,
String user, String pass) throws SQLException {
DateTime dateTime = DateTime.now();
String endDateStr =
dateTime.getYear() + "-" + String.format("%02d", dateTime.getMonthOfYear()) + "-" +
String.format("%02d", dateTime.getDayOfMonth());
String endDateStr = dateTime.getYear() + "-" + String.format("%02d", dateTime.getMonthOfYear()) + "-"
+ String.format("%02d", dateTime.getDayOfMonth());
dateTime = dateTime.minusDays(partitions);
String startDateStr =
dateTime.getYear() + "-" + String.format("%02d", dateTime.getMonthOfYear()) + "-" +
String.format("%02d", dateTime.getDayOfMonth());
String startDateStr = dateTime.getYear() + "-" + String.format("%02d", dateTime.getMonthOfYear()) + "-"
+ String.format("%02d", dateTime.getDayOfMonth());
System.out.println("Start date " + startDateStr + " and end date " + endDateStr);
return countRecords(jdbcUrl, source, srcDb, startDateStr, endDateStr, user, pass);
}
private static long countRecords(String jdbcUrl, HoodieTableMetaClient source, String srcDb,
String startDateStr,
private static long countRecords(String jdbcUrl, HoodieTableMetaClient source, String srcDb, String startDateStr,
String endDateStr, String user, String pass) throws SQLException {
Connection conn = HiveUtil.getConnection(jdbcUrl, user, pass);
ResultSet rs = null;
@@ -109,9 +103,8 @@ public class HiveUtil {
stmt.execute("set hive.input.format=org.apache.hadoop.hive.ql.io.HiveInputFormat");
stmt.execute("set hive.stats.autogather=false");
rs = stmt.executeQuery(
"select count(`_hoodie_commit_time`) as cnt from " + srcDb + "." + source.getTableConfig()
.getTableName() + " where datestr>'" + startDateStr + "' and datestr<='"
+ endDateStr + "'");
"select count(`_hoodie_commit_time`) as cnt from " + srcDb + "." + source.getTableConfig().getTableName()
+ " where datestr>'" + startDateStr + "' and datestr<='" + endDateStr + "'");
if (rs.next()) {
return rs.getLong("cnt");
}
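For reference, the count queries above follow the plain Hive JDBC pattern. A hedged sketch of the same flow outside this class (the JDBC URL, credentials and table name are placeholders, not values from this change):

import java.sql.Connection;
import java.sql.DriverManager;
import java.sql.ResultSet;
import java.sql.Statement;

public class HiveCountExample {

  public static void main(String[] args) throws Exception {
    Class.forName("org.apache.hive.jdbc.HiveDriver");
    try (Connection conn = DriverManager.getConnection("jdbc:hive2://localhost:10000/default", "user", "pass");
        Statement stmt = conn.createStatement()) {
      // Same session settings the utility applies before counting
      stmt.execute("set hive.input.format=org.apache.hadoop.hive.ql.io.HiveInputFormat");
      stmt.execute("set hive.stats.autogather=false");
      try (ResultSet rs = stmt.executeQuery(
          "select count(`_hoodie_commit_time`) as cnt from mydb.mytable")) {
        if (rs.next()) {
          System.out.println("Total records: " + rs.getLong("cnt"));
        }
      }
    }
  }
}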

View File

@@ -24,7 +24,7 @@ import java.util.logging.Logger;
public class InputStreamConsumer extends Thread {
protected final static Logger LOG = Logger.getLogger(InputStreamConsumer.class.getName());
protected static final Logger LOG = Logger.getLogger(InputStreamConsumer.class.getName());
private InputStream is;
public InputStreamConsumer(InputStream is) {

View File

@@ -35,12 +35,9 @@ public class SparkUtil {
* TODO: Need to fix a bunch of hardcoded stuff here eg: history server, spark distro
*/
public static SparkLauncher initLauncher(String propertiesFile) throws URISyntaxException {
String currentJar = new File(
SparkUtil.class.getProtectionDomain().getCodeSource().getLocation().toURI().getPath())
String currentJar = new File(SparkUtil.class.getProtectionDomain().getCodeSource().getLocation().toURI().getPath())
.getAbsolutePath();
SparkLauncher sparkLauncher =
new SparkLauncher().setAppResource(currentJar)
.setMainClass(SparkMain.class.getName())
SparkLauncher sparkLauncher = new SparkLauncher().setAppResource(currentJar).setMainClass(SparkMain.class.getName())
.setPropertiesFile(propertiesFile);
File libDirectory = new File(new File(currentJar).getParent(), "lib");
for (String library : libDirectory.list()) {
@@ -60,8 +57,7 @@ public class SparkUtil {
// Configure hadoop conf
sparkConf.set("spark.hadoop.mapred.output.compress", "true");
sparkConf.set("spark.hadoop.mapred.output.compression.codec", "true");
sparkConf.set("spark.hadoop.mapred.output.compression.codec",
"org.apache.hadoop.io.compress.GzipCodec");
sparkConf.set("spark.hadoop.mapred.output.compression.codec", "org.apache.hadoop.io.compress.GzipCodec");
sparkConf.set("spark.hadoop.mapred.output.compression.type", "BLOCK");
sparkConf = HoodieWriteClient.registerClasses(sparkConf);
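The launcher built above is the standard org.apache.spark.launcher API. A minimal sketch of driving it (the jar path, main class and master are placeholders, and a Spark installation is assumed to be available via SPARK_HOME or setSparkHome):

import org.apache.spark.launcher.SparkLauncher;

public class LauncherExample {

  public static void main(String[] args) throws Exception {
    SparkLauncher launcher = new SparkLauncher()
        .setAppResource("/path/to/hoodie-cli.jar")   // placeholder application jar
        .setMainClass("com.example.SparkMain")       // placeholder main class
        .setMaster("local[2]");
    Process spark = launcher.launch();               // spawns a spark-submit process
    int exitCode = spark.waitFor();
    System.out.println("Spark job exited with code " + exitCode);
  }
}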

View File

@@ -50,17 +50,17 @@ import scala.Tuple2;
*/
public class HoodieReadClient<T extends HoodieRecordPayload> implements Serializable {
private static Logger logger = LogManager.getLogger(HoodieReadClient.class);
private static final Logger logger = LogManager.getLogger(HoodieReadClient.class);
private transient final JavaSparkContext jsc;
private final transient JavaSparkContext jsc;
private transient final FileSystem fs;
private final transient FileSystem fs;
/**
* TODO: We need to persist the index type into hoodie.properties and be able to access the index
* just with a simple basepath pointing to the dataset. Until, then just always assume a
* BloomIndex
*/
private transient final HoodieIndex<T> index;
private final transient HoodieIndex<T> index;
private final HoodieTimeline commitTimeline;
private HoodieTable hoodieTable;
private transient Optional<SQLContext> sqlContextOpt;
@@ -69,8 +69,7 @@ public class HoodieReadClient<T extends HoodieRecordPayload> implements Serializ
* @param basePath path to Hoodie dataset
*/
public HoodieReadClient(JavaSparkContext jsc, String basePath) {
this(jsc, HoodieWriteConfig.newBuilder()
.withPath(basePath)
this(jsc, HoodieWriteConfig.newBuilder().withPath(basePath)
// by default we use HoodieBloomIndex
.withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build())
@@ -78,7 +77,6 @@ public class HoodieReadClient<T extends HoodieRecordPayload> implements Serializ
}
/**
*
* @param jsc
* @param basePath
* @param sqlContext
@@ -96,8 +94,8 @@ public class HoodieReadClient<T extends HoodieRecordPayload> implements Serializ
this.jsc = jsc;
this.fs = FSUtils.getFs(basePath, jsc.hadoopConfiguration());
// Create a Hoodie table which encapsulated the commits and files visible
this.hoodieTable = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath, true),
this.hoodieTable = HoodieTable
.getHoodieTable(new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath, true),
clientConfig);
this.commitTimeline = hoodieTable.getCommitTimeline().filterCompletedInstants();
this.index = HoodieIndex.createIndex(clientConfig, jsc);
@@ -126,33 +124,27 @@ public class HoodieReadClient<T extends HoodieRecordPayload> implements Serializ
*
* @return a dataframe
*/
public Dataset<Row> read(JavaRDD<HoodieKey> hoodieKeys, int parallelism)
throws Exception {
public Dataset<Row> read(JavaRDD<HoodieKey> hoodieKeys, int parallelism) throws Exception {
assertSqlContext();
JavaPairRDD<HoodieKey, Optional<String>> keyToFileRDD =
index.fetchRecordLocation(hoodieKeys, hoodieTable);
List<String> paths = keyToFileRDD
.filter(keyFileTuple -> keyFileTuple._2().isPresent())
.map(keyFileTuple -> keyFileTuple._2().get())
.collect();
JavaPairRDD<HoodieKey, Optional<String>> keyToFileRDD = index
.fetchRecordLocation(hoodieKeys, hoodieTable);
List<String> paths = keyToFileRDD.filter(keyFileTuple -> keyFileTuple._2().isPresent())
.map(keyFileTuple -> keyFileTuple._2().get()).collect();
// record locations might be same for multiple keys, so need a unique list
Set<String> uniquePaths = new HashSet<>(paths);
Dataset<Row> originalDF = sqlContextOpt.get().read()
.parquet(uniquePaths.toArray(new String[uniquePaths.size()]));
StructType schema = originalDF.schema();
JavaPairRDD<HoodieKey, Row> keyRowRDD = originalDF.javaRDD()
.mapToPair(row -> {
HoodieKey key = new HoodieKey(
row.getAs(HoodieRecord.RECORD_KEY_METADATA_FIELD),
JavaPairRDD<HoodieKey, Row> keyRowRDD = originalDF.javaRDD().mapToPair(row -> {
HoodieKey key = new HoodieKey(row.getAs(HoodieRecord.RECORD_KEY_METADATA_FIELD),
row.getAs(HoodieRecord.PARTITION_PATH_METADATA_FIELD));
return new Tuple2<>(key, row);
});
// Now, we need to further filter out, for only rows that match the supplied hoodie keys
JavaRDD<Row> rowRDD = keyRowRDD.join(keyToFileRDD, parallelism)
.map(tuple -> tuple._2()._1());
JavaRDD<Row> rowRDD = keyRowRDD.join(keyToFileRDD, parallelism).map(tuple -> tuple._2()._1());
return sqlContextOpt.get().createDataFrame(rowRDD, schema);
}
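A hedged usage sketch for the read path shown above: look up a handful of HoodieKeys and get the matching rows back as a DataFrame. The base path and key values are placeholders, the SQLContext-taking constructor is the one referenced in the Javadoc above, and the com.uber.hoodie package names are assumptions.

import java.util.Arrays;
import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.sql.Dataset;
import org.apache.spark.sql.Row;
import org.apache.spark.sql.SQLContext;
import com.uber.hoodie.HoodieReadClient;
import com.uber.hoodie.common.model.HoodieAvroPayload;
import com.uber.hoodie.common.model.HoodieKey;

public class ReadClientExample {

  public static void main(String[] args) throws Exception {
    JavaSparkContext jsc = new JavaSparkContext(
        new SparkConf().setAppName("hoodie-read-example").setMaster("local[2]"));
    SQLContext sqlContext = new SQLContext(jsc);

    // Placeholder base path of an existing Hoodie dataset
    HoodieReadClient<HoodieAvroPayload> readClient =
        new HoodieReadClient<>(jsc, "/tmp/hoodie/sample-table", sqlContext);

    // Illustrative record key + partition path
    JavaRDD<HoodieKey> keys = jsc.parallelize(Arrays.asList(new HoodieKey("key-1", "2016/08/02")));
    Dataset<Row> rows = readClient.read(keys, 2);   // parallelism of 2 for the location join
    rows.show();

    jsc.stop();
  }
}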

View File

@@ -81,18 +81,18 @@ import scala.Tuple2;
/**
* Hoodie Write Client helps you build datasets on HDFS [insert()] and then perform efficient
* mutations on a HDFS dataset [upsert()]
*
* <p>
* Note that, at any given time, there can only be one Spark job performing these operatons on a
* Hoodie dataset.
*/
public class HoodieWriteClient<T extends HoodieRecordPayload> implements Serializable {
private static Logger logger = LogManager.getLogger(HoodieWriteClient.class);
private transient final FileSystem fs;
private transient final JavaSparkContext jsc;
private final transient FileSystem fs;
private final transient JavaSparkContext jsc;
private final HoodieWriteConfig config;
private transient final HoodieMetrics metrics;
private transient final HoodieIndex<T> index;
private final transient HoodieMetrics metrics;
private final transient HoodieIndex<T> index;
private transient Timer.Context writeContext = null;
/**
@@ -100,8 +100,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
* @param clientConfig
* @throws Exception
*/
public HoodieWriteClient(JavaSparkContext jsc, HoodieWriteConfig clientConfig)
throws Exception {
public HoodieWriteClient(JavaSparkContext jsc, HoodieWriteConfig clientConfig) throws Exception {
this(jsc, clientConfig, false);
}
@@ -129,6 +128,12 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
}
}
public static SparkConf registerClasses(SparkConf conf) {
conf.registerKryoClasses(
new Class[] {HoodieWriteConfig.class, HoodieRecord.class, HoodieKey.class});
return conf;
}
/**
* Filter out HoodieRecords that already exists in the output folder. This is useful in
* deduplication.
@@ -139,8 +144,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
public JavaRDD<HoodieRecord<T>> filterExists(JavaRDD<HoodieRecord<T>> hoodieRecords) {
// Create a Hoodie table which encapsulated the commits and files visible
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
JavaRDD<HoodieRecord<T>> recordsWithLocation = index.tagLocation(hoodieRecords, table);
return recordsWithLocation.filter(v1 -> !v1.isCurrentLocationKnown());
@@ -153,9 +157,8 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
HoodieTable<T> table = getTableAndInitCtx();
try {
// De-dupe/merge if needed
JavaRDD<HoodieRecord<T>> dedupedRecords =
combineOnCondition(config.shouldCombineBeforeUpsert(), records,
config.getUpsertShuffleParallelism());
JavaRDD<HoodieRecord<T>> dedupedRecords = combineOnCondition(
config.shouldCombineBeforeUpsert(), records, config.getUpsertShuffleParallelism());
// perform index loop up to get existing location of records
JavaRDD<HoodieRecord<T>> taggedRecords = index.tagLocation(dedupedRecords, table);
@@ -170,7 +173,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
/**
* Upserts the given prepared records into the Hoodie table, at the supplied commitTime.
*
* <p>
* This implementation requires that the input records are already tagged, and de-duped if
* needed.
*
@@ -187,15 +190,15 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
if (e instanceof HoodieUpsertException) {
throw (HoodieUpsertException) e;
}
throw new HoodieUpsertException("Failed to upsert prepared records for commit time " +
commitTime, e);
throw new HoodieUpsertException(
"Failed to upsert prepared records for commit time " + commitTime, e);
}
}
/**
* Inserts the given HoodieRecords, into the table. This API is intended to be used for normal
* writes.
*
* <p>
* This implementation skips the index check and is able to leverage benefits such as small file
* handling/blocking alignment, as with upsert(), by profiling the workload
*
@@ -207,9 +210,8 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
HoodieTable<T> table = getTableAndInitCtx();
try {
// De-dupe/merge if needed
JavaRDD<HoodieRecord<T>> dedupedRecords =
combineOnCondition(config.shouldCombineBeforeInsert(), records,
config.getInsertShuffleParallelism());
JavaRDD<HoodieRecord<T>> dedupedRecords = combineOnCondition(
config.shouldCombineBeforeInsert(), records, config.getInsertShuffleParallelism());
return upsertRecordsInternal(dedupedRecords, commitTime, table, false);
} catch (Throwable e) {
@@ -222,7 +224,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
/**
* Inserts the given prepared records into the Hoodie table, at the supplied commitTime.
*
* <p>
* This implementation skips the index check, skips de-duping and is able to leverage benefits
* such as small file handling/blocking alignment, as with insert(), by profiling the workload.
* The prepared HoodieRecords should be de-duped if needed.
@@ -240,8 +242,8 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
if (e instanceof HoodieInsertException) {
throw e;
}
throw new HoodieInsertException("Failed to insert prepared records for commit time " +
commitTime, e);
throw new HoodieInsertException(
"Failed to insert prepared records for commit time " + commitTime, e);
}
}
@@ -249,7 +251,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
* Loads the given HoodieRecords, as inserts into the table. This is suitable for doing big bulk
* loads into a Hoodie table for the very first time (e.g: converting an existing dataset to
* Hoodie).
*
* <p>
* This implementation uses sortBy (which does range partitioning based on reservoir sampling) and
* attempts to control the numbers of files with less memory compared to the {@link
* HoodieWriteClient#insert(JavaRDD, String)}
@@ -267,7 +269,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
* Loads the given HoodieRecords, as inserts into the table. This is suitable for doing big bulk
* loads into a Hoodie table for the very first time (e.g: converting an existing dataset to
* Hoodie).
*
* <p>
* This implementation uses sortBy (which does range partitioning based on reservoir sampling) and
* attempts to control the numbers of files with less memory compared to the {@link
* HoodieWriteClient#insert(JavaRDD, String)}. Optionally it allows users to specify their own
@@ -280,23 +282,20 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
* before they are inserted into hoodie.
* @return JavaRDD[WriteStatus] - RDD of WriteStatus to inspect errors and counts
*/
public JavaRDD<WriteStatus> bulkInsert(JavaRDD<HoodieRecord<T>> records,
final String commitTime,
public JavaRDD<WriteStatus> bulkInsert(JavaRDD<HoodieRecord<T>> records, final String commitTime,
Option<UserDefinedBulkInsertPartitioner> bulkInsertPartitioner) {
HoodieTable<T> table = getTableAndInitCtx();
try {
// De-dupe/merge if needed
JavaRDD<HoodieRecord<T>> dedupedRecords =
combineOnCondition(config.shouldCombineBeforeInsert(), records,
config.getInsertShuffleParallelism());
JavaRDD<HoodieRecord<T>> dedupedRecords = combineOnCondition(
config.shouldCombineBeforeInsert(), records, config.getInsertShuffleParallelism());
return bulkInsertInternal(dedupedRecords, commitTime, table, bulkInsertPartitioner);
} catch (Throwable e) {
if (e instanceof HoodieInsertException) {
throw e;
}
throw new HoodieInsertException("Failed to bulk insert for commit time " + commitTime,
e);
throw new HoodieInsertException("Failed to bulk insert for commit time " + commitTime, e);
}
}
@@ -304,7 +303,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
* Loads the given HoodieRecords, as inserts into the table. This is suitable for doing big bulk
* loads into a Hoodie table for the very first time (e.g: converting an existing dataset to
* Hoodie). The input records should contain no duplicates if needed.
*
* <p>
* This implementation uses sortBy (which does range partitioning based on reservoir sampling) and
* attempts to control the numbers of files with less memory compared to the {@link
* HoodieWriteClient#insert(JavaRDD, String)}. Optionally it allows users to specify their own
@@ -318,8 +317,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
* @return JavaRDD[WriteStatus] - RDD of WriteStatus to inspect errors and counts
*/
public JavaRDD<WriteStatus> bulkInsertPreppedRecords(JavaRDD<HoodieRecord<T>> preppedRecords,
final String commitTime,
Option<UserDefinedBulkInsertPartitioner> bulkInsertPartitioner) {
final String commitTime, Option<UserDefinedBulkInsertPartitioner> bulkInsertPartitioner) {
HoodieTable<T> table = getTableAndInitCtx();
try {
return bulkInsertInternal(preppedRecords, commitTime, table, bulkInsertPartitioner);
@@ -327,35 +325,29 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
if (e instanceof HoodieInsertException) {
throw e;
}
throw new HoodieInsertException("Failed to bulk insert prepared records for commit time " +
commitTime, e);
throw new HoodieInsertException(
"Failed to bulk insert prepared records for commit time " + commitTime, e);
}
}
private JavaRDD<WriteStatus> bulkInsertInternal(
JavaRDD<HoodieRecord<T>> dedupedRecords,
String commitTime,
HoodieTable<T> table,
private JavaRDD<WriteStatus> bulkInsertInternal(JavaRDD<HoodieRecord<T>> dedupedRecords,
String commitTime, HoodieTable<T> table,
Option<UserDefinedBulkInsertPartitioner> bulkInsertPartitioner) {
final JavaRDD<HoodieRecord<T>> repartitionedRecords;
if (bulkInsertPartitioner.isDefined()) {
repartitionedRecords =
bulkInsertPartitioner.get().repartitionRecords(dedupedRecords,
config.getBulkInsertShuffleParallelism());
repartitionedRecords = bulkInsertPartitioner.get()
.repartitionRecords(dedupedRecords, config.getBulkInsertShuffleParallelism());
} else {
// Now, sort the records and line them up nicely for loading.
repartitionedRecords = dedupedRecords
.sortBy(record -> {
repartitionedRecords = dedupedRecords.sortBy(record -> {
// Let's use "partitionPath + key" as the sort key. Spark, will ensure
// the records split evenly across RDD partitions, such that small partitions fit
// into 1 RDD partition, while big ones spread evenly across multiple RDD partitions
return String
.format("%s+%s", record.getPartitionPath(), record.getRecordKey());
return String.format("%s+%s", record.getPartitionPath(), record.getRecordKey());
}, true, config.getBulkInsertShuffleParallelism());
}
JavaRDD<WriteStatus> writeStatusRDD = repartitionedRecords
.mapPartitionsWithIndex(new BulkInsertMapFunction<T>(commitTime, config, table),
true)
.mapPartitionsWithIndex(new BulkInsertMapFunction<T>(commitTime, config, table), true)
.flatMap(writeStatuses -> writeStatuses.iterator());
return updateIndexAndCommitIfNeeded(writeStatusRDD, table, commitTime);
@@ -375,8 +367,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
}
private JavaRDD<HoodieRecord<T>> combineOnCondition(boolean condition,
JavaRDD<HoodieRecord<T>> records,
int parallelism) {
JavaRDD<HoodieRecord<T>> records, int parallelism) {
if (condition) {
return deduplicateRecords(records, parallelism);
}
@@ -390,8 +381,8 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
* files) are rolled back based on commit time. // TODO : Create a new WorkloadProfile metadata
* file instead of using HoodieCommitMetadata
*/
private void saveWorkloadProfileMetadataToInflight(WorkloadProfile profile,
HoodieTable<T> table, String commitTime) throws HoodieCommitException {
private void saveWorkloadProfileMetadataToInflight(WorkloadProfile profile, HoodieTable<T> table,
String commitTime) throws HoodieCommitException {
try {
HoodieCommitMetadata metadata = new HoodieCommitMetadata();
profile.getPartitionPaths().stream().forEach(path -> {
@@ -416,9 +407,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
}
private JavaRDD<WriteStatus> upsertRecordsInternal(JavaRDD<HoodieRecord<T>> preppedRecords,
String commitTime,
HoodieTable<T> hoodieTable,
final boolean isUpsert) {
String commitTime, HoodieTable<T> hoodieTable, final boolean isUpsert) {
// Cache the tagged records, so we don't end up computing both
// TODO: Consistent contract in HoodieWriteClient regarding preppedRecord storage level handling
@@ -441,20 +430,16 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
JavaRDD<WriteStatus> writeStatusRDD = partitionedRecords
.mapPartitionsWithIndex((partition, recordItr) -> {
if (isUpsert) {
return hoodieTable
.handleUpsertPartition(commitTime, partition, recordItr, partitioner);
return hoodieTable.handleUpsertPartition(commitTime, partition, recordItr, partitioner);
} else {
return hoodieTable
.handleInsertPartition(commitTime, partition, recordItr, partitioner);
return hoodieTable.handleInsertPartition(commitTime, partition, recordItr, partitioner);
}
}, true)
.flatMap(writeStatuses -> writeStatuses.iterator());
}, true).flatMap(writeStatuses -> writeStatuses.iterator());
return updateIndexAndCommitIfNeeded(writeStatusRDD, hoodieTable, commitTime);
}
private Partitioner getPartitioner(HoodieTable table, boolean isUpsert,
WorkloadProfile profile) {
private Partitioner getPartitioner(HoodieTable table, boolean isUpsert, WorkloadProfile profile) {
if (isUpsert) {
return table.getUpsertPartitioner(profile);
} else {
@@ -474,13 +459,9 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
private JavaRDD<HoodieRecord<T>> partition(JavaRDD<HoodieRecord<T>> dedupedRecords,
Partitioner partitioner) {
return dedupedRecords
.mapToPair(record ->
new Tuple2<>(
new Tuple2<>(record.getKey(), Option.apply(record.getCurrentLocation())),
record))
.partitionBy(partitioner)
.map(tuple -> tuple._2());
return dedupedRecords.mapToPair(record -> new Tuple2<>(
new Tuple2<>(record.getKey(), Option.apply(record.getCurrentLocation())), record))
.partitionBy(partitioner).map(tuple -> tuple._2());
}
/**
@@ -493,12 +474,10 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
/**
* Commit changes performed at the given commitTime marker
*/
public boolean commit(String commitTime,
JavaRDD<WriteStatus> writeStatuses,
public boolean commit(String commitTime, JavaRDD<WriteStatus> writeStatuses,
Optional<HashMap<String, String>> extraMetadata) {
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
return commit(commitTime, writeStatuses, extraMetadata, table.getCommitActionType());
}
@@ -508,15 +487,13 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
logger.info("Commiting " + commitTime);
// Create a Hoodie table which encapsulated the commits and files visible
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
HoodieActiveTimeline activeTimeline = table.getActiveTimeline();
List<Tuple2<String, HoodieWriteStat>> stats = writeStatuses
.mapToPair((PairFunction<WriteStatus, String, HoodieWriteStat>) writeStatus ->
new Tuple2<>(writeStatus.getPartitionPath(), writeStatus.getStat()))
.collect();
List<Tuple2<String, HoodieWriteStat>> stats = writeStatuses.mapToPair(
(PairFunction<WriteStatus, String, HoodieWriteStat>) writeStatus -> new Tuple2<>(
writeStatus.getPartitionPath(), writeStatus.getStat())).collect();
HoodieCommitMetadata metadata = new HoodieCommitMetadata();
for (Tuple2<String, HoodieWriteStat> stat : stats) {
@@ -531,8 +508,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
durationInMs.ifPresent(duration -> {
logger.info("Finalize write elapsed time (milliseconds): " + duration);
metrics.updateFinalizeWriteMetrics(duration, result.get());
}
);
});
}
// add in extra metadata
@@ -541,8 +517,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
}
try {
activeTimeline.saveAsComplete(
new HoodieInstant(true, actionType, commitTime),
activeTimeline.saveAsComplete(new HoodieInstant(true, actionType, commitTime),
Optional.of(metadata.toJsonString().getBytes(StandardCharsets.UTF_8)));
// Save was a success
// Do a inline compaction if enabled
@@ -566,9 +541,9 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
}
if (writeContext != null) {
long durationInMs = metrics.getDurationInMs(writeContext.stop());
metrics.updateCommitMetrics(
HoodieActiveTimeline.COMMIT_FORMATTER.parse(commitTime).getTime(), durationInMs,
metadata);
metrics
.updateCommitMetrics(HoodieActiveTimeline.COMMIT_FORMATTER.parse(commitTime).getTime(),
durationInMs, metadata);
writeContext = null;
}
logger.info("Committed " + commitTime);
@@ -587,10 +562,10 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
* Savepoint a specific commit. Latest version of data files as of the passed in commitTime will
* be referenced in the savepoint and will never be cleaned. The savepointed commit will never be
* rolledback or archived.
*
* <p>
* This gives an option to rollback the state to the savepoint anytime. Savepoint needs to be
* manually created and deleted.
*
* <p>
* Savepoint should be on a commit that could not have been cleaned.
*
* @param user - User creating the savepoint
@@ -599,8 +574,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
*/
public boolean savepoint(String user, String comment) {
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
if (table.getCompletedCommitTimeline().empty()) {
throw new HoodieSavepointException("Could not savepoint. Commit timeline is empty");
}
@@ -614,10 +588,10 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
* Savepoint a specific commit. Latest version of data files as of the passed in commitTime will
* be referenced in the savepoint and will never be cleaned. The savepointed commit will never be
* rolledback or archived.
*
* <p>
* This gives an option to rollback the state to the savepoint anytime. Savepoint needs to be
* manually created and deleted.
*
* <p>
* Savepoint should be on a commit that could not have been cleaned.
*
* @param commitTime - commit that should be savepointed
@@ -627,8 +601,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
*/
public boolean savepoint(String commitTime, String user, String comment) {
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
Optional<HoodieInstant> cleanInstant = table.getCompletedCleanTimeline().lastInstant();
HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION,
@@ -646,8 +619,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
table.getActiveTimeline().getInstantDetails(cleanInstant.get()).get());
lastCommitRetained = cleanMetadata.getEarliestCommitToRetain();
} else {
lastCommitRetained =
table.getCompletedCommitTimeline().firstInstant().get().getTimestamp();
lastCommitRetained = table.getCompletedCommitTimeline().firstInstant().get().getTimestamp();
}
// Cannot allow savepoint time on a commit that could have been cleaned
@@ -656,24 +628,23 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
"Could not savepoint commit " + commitTime + " as this is beyond the lookup window "
+ lastCommitRetained);
Map<String, List<String>> latestFilesMap = jsc.parallelize(
FSUtils.getAllPartitionPaths(fs, table.getMetaClient().getBasePath(),
Map<String, List<String>> latestFilesMap = jsc.parallelize(FSUtils
.getAllPartitionPaths(fs, table.getMetaClient().getBasePath(),
config.shouldAssumeDatePartitioning()))
.mapToPair((PairFunction<String, String, List<String>>) partitionPath -> {
// Scan all partitions files with this commit time
logger.info("Collecting latest files in partition path " + partitionPath);
TableFileSystemView.ReadOptimizedView view = table.getROFileSystemView();
List<String> latestFiles =
view.getLatestDataFilesBeforeOrOn(partitionPath, commitTime)
List<String> latestFiles = view.getLatestDataFilesBeforeOrOn(partitionPath, commitTime)
.map(HoodieDataFile::getFileName).collect(Collectors.toList());
return new Tuple2<>(partitionPath, latestFiles);
}).collectAsMap();
HoodieSavepointMetadata metadata =
AvroUtils.convertSavepointMetadata(user, comment, latestFilesMap);
HoodieSavepointMetadata metadata = AvroUtils
.convertSavepointMetadata(user, comment, latestFilesMap);
// Nothing to save in the savepoint
table.getActiveTimeline().saveAsComplete(
new HoodieInstant(true, HoodieTimeline.SAVEPOINT_ACTION, commitTime),
table.getActiveTimeline()
.saveAsComplete(new HoodieInstant(true, HoodieTimeline.SAVEPOINT_ACTION, commitTime),
AvroUtils.serializeSavepointMetadata(metadata));
logger.info("Savepoint " + commitTime + " created");
return true;
@@ -691,22 +662,20 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
*/
public void deleteSavepoint(String savepointTime) {
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
HoodieActiveTimeline activeTimeline = table.getActiveTimeline();
HoodieInstant savePoint =
new HoodieInstant(false, HoodieTimeline.SAVEPOINT_ACTION, savepointTime);
boolean isSavepointPresent =
table.getCompletedSavepointTimeline().containsInstant(savePoint);
HoodieInstant savePoint = new HoodieInstant(false, HoodieTimeline.SAVEPOINT_ACTION,
savepointTime);
boolean isSavepointPresent = table.getCompletedSavepointTimeline().containsInstant(savePoint);
if (!isSavepointPresent) {
logger.warn("No savepoint present " + savepointTime);
return;
}
activeTimeline.revertToInflight(savePoint);
activeTimeline.deleteInflight(
new HoodieInstant(true, HoodieTimeline.SAVEPOINT_ACTION, savepointTime));
activeTimeline
.deleteInflight(new HoodieInstant(true, HoodieTimeline.SAVEPOINT_ACTION, savepointTime));
logger.info("Savepoint " + savepointTime + " deleted");
}
@@ -719,30 +688,27 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
*/
public boolean rollbackToSavepoint(String savepointTime) {
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
HoodieActiveTimeline activeTimeline = table.getActiveTimeline();
HoodieTimeline commitTimeline = table.getCommitsTimeline();
HoodieInstant savePoint =
new HoodieInstant(false, HoodieTimeline.SAVEPOINT_ACTION, savepointTime);
boolean isSavepointPresent =
table.getCompletedSavepointTimeline().containsInstant(savePoint);
HoodieInstant savePoint = new HoodieInstant(false, HoodieTimeline.SAVEPOINT_ACTION,
savepointTime);
boolean isSavepointPresent = table.getCompletedSavepointTimeline().containsInstant(savePoint);
if (!isSavepointPresent) {
throw new HoodieRollbackException("No savepoint for commitTime " + savepointTime);
}
List<String> commitsToRollback =
commitTimeline.findInstantsAfter(savepointTime, Integer.MAX_VALUE).getInstants()
List<String> commitsToRollback = commitTimeline
.findInstantsAfter(savepointTime, Integer.MAX_VALUE).getInstants()
.map(HoodieInstant::getTimestamp).collect(Collectors.toList());
logger.info("Rolling back commits " + commitsToRollback);
rollback(commitsToRollback);
// Make sure the rollback was successful
Optional<HoodieInstant> lastInstant =
activeTimeline.reload().getCommitsTimeline().filterCompletedInstants()
.lastInstant();
Optional<HoodieInstant> lastInstant = activeTimeline.reload().getCommitsTimeline()
.filterCompletedInstants().lastInstant();
Preconditions.checkArgument(lastInstant.isPresent());
Preconditions.checkArgument(lastInstant.get().getTimestamp().equals(savepointTime),
savepointTime + "is not the last commit after rolling back " + commitsToRollback
@@ -771,16 +737,14 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
// Create a Hoodie table which encapsulated the commits and files visible
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
HoodieActiveTimeline activeTimeline = table.getActiveTimeline();
HoodieTimeline inflightTimeline = table.getInflightCommitTimeline();
HoodieTimeline commitTimeline = table.getCompletedCommitTimeline();
// Check if any of the commits is a savepoint - do not allow rollback on those commits
List<String> savepoints =
table.getCompletedSavepointTimeline().getInstants().map(HoodieInstant::getTimestamp)
.collect(Collectors.toList());
List<String> savepoints = table.getCompletedSavepointTimeline().getInstants()
.map(HoodieInstant::getTimestamp).collect(Collectors.toList());
commits.forEach(s -> {
if (savepoints.contains(s)) {
throw new HoodieRollbackException(
@@ -800,16 +764,15 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
String lastCommit = commits.get(commits.size() - 1);
if (!commitTimeline.empty() && !commitTimeline
.findInstantsAfter(lastCommit, Integer.MAX_VALUE).empty()) {
throw new HoodieRollbackException("Found commits after time :" + lastCommit +
", please rollback greater commits first");
throw new HoodieRollbackException(
"Found commits after time :" + lastCommit + ", please rollback greater commits first");
}
List<String> inflights = inflightTimeline.getInstants().map(HoodieInstant::getTimestamp)
.collect(Collectors.toList());
if (!inflights.isEmpty() && inflights.indexOf(lastCommit) != inflights.size() - 1) {
throw new HoodieRollbackException(
"Found in-flight commits after time :" + lastCommit +
", please rollback greater commits first");
throw new HoodieRollbackException("Found in-flight commits after time :" + lastCommit
+ ", please rollback greater commits first");
}
List<HoodieRollbackStat> stats = table.rollback(jsc, commits);
@@ -817,8 +780,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
// cleanup index entries
commits.stream().forEach(s -> {
if (!index.rollbackCommit(s)) {
throw new HoodieRollbackException(
"Rollback index changes failed, for time :" + s);
throw new HoodieRollbackException("Rollback index changes failed, for time :" + s);
}
});
logger.info("Index rolled back for commits " + commits);
@@ -826,13 +788,12 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
Optional<Long> durationInMs = Optional.empty();
if (context != null) {
durationInMs = Optional.of(metrics.getDurationInMs(context.stop()));
Long numFilesDeleted = stats.stream()
.mapToLong(stat -> stat.getSuccessDeleteFiles().size())
Long numFilesDeleted = stats.stream().mapToLong(stat -> stat.getSuccessDeleteFiles().size())
.sum();
metrics.updateRollbackMetrics(durationInMs.get(), numFilesDeleted);
}
HoodieRollbackMetadata rollbackMetadata =
AvroUtils.convertRollbackMetadata(startRollbackTime, durationInMs, commits, stats);
HoodieRollbackMetadata rollbackMetadata = AvroUtils
.convertRollbackMetadata(startRollbackTime, durationInMs, commits, stats);
table.getActiveTimeline().saveAsComplete(
new HoodieInstant(true, HoodieTimeline.ROLLBACK_ACTION, startRollbackTime),
AvroUtils.serializeRollbackMetadata(rollbackMetadata));
@@ -846,8 +807,8 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
table.getActiveTimeline().getRollbackTimeline().getInstants());
}
} catch (IOException e) {
throw new HoodieRollbackException("Failed to rollback " +
config.getBasePath() + " commits " + commits, e);
throw new HoodieRollbackException(
"Failed to rollback " + config.getBasePath() + " commits " + commits, e);
}
}
@@ -880,8 +841,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
// Create a Hoodie table which encapsulated the commits and files visible
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(),
true), config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
List<HoodieCleanStat> cleanStats = table.clean(jsc);
if (cleanStats.isEmpty()) {
@@ -896,14 +856,14 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
}
// Create the metadata and save it
HoodieCleanMetadata metadata =
AvroUtils.convertCleanMetadata(startCleanTime, durationInMs, cleanStats);
HoodieCleanMetadata metadata = AvroUtils
.convertCleanMetadata(startCleanTime, durationInMs, cleanStats);
logger.info("Cleaned " + metadata.getTotalFilesDeleted() + " files");
metrics.updateCleanMetrics(durationInMs.orElseGet(() -> -1L),
metadata.getTotalFilesDeleted());
metrics
.updateCleanMetrics(durationInMs.orElseGet(() -> -1L), metadata.getTotalFilesDeleted());
table.getActiveTimeline().saveAsComplete(
new HoodieInstant(true, HoodieTimeline.CLEAN_ACTION, startCleanTime),
table.getActiveTimeline()
.saveAsComplete(new HoodieInstant(true, HoodieTimeline.CLEAN_ACTION, startCleanTime),
AvroUtils.serializeCleanMetadata(metadata));
logger.info("Marked clean started on " + startCleanTime + " as complete");
@@ -930,12 +890,10 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
public void startCommitWithTime(String commitTime) {
logger.info("Generate a new commit time " + commitTime);
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
HoodieActiveTimeline activeTimeline = table.getActiveTimeline();
String commitActionType = table.getCommitActionType();
activeTimeline.createInflight(
new HoodieInstant(true, commitActionType, commitTime));
activeTimeline.createInflight(new HoodieInstant(true, commitActionType, commitTime));
}
/**
@@ -948,17 +906,16 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
return commitTime;
}
/** Since MOR tableType default to {@link HoodieTimeline#DELTA_COMMIT_ACTION},
* we need to explicitly set to {@link HoodieTimeline#COMMIT_ACTION} for compaction
/**
* Since MOR tableType default to {@link HoodieTimeline#DELTA_COMMIT_ACTION}, we need to
* explicitly set to {@link HoodieTimeline#COMMIT_ACTION} for compaction
*/
public void startCompactionWithTime(String commitTime) {
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
HoodieActiveTimeline activeTimeline = table.getActiveTimeline();
String commitActionType = HoodieTimeline.COMMIT_ACTION;
activeTimeline.createInflight(
new HoodieInstant(true, commitActionType, commitTime));
activeTimeline.createInflight(new HoodieInstant(true, commitActionType, commitTime));
}
/**
@@ -968,8 +925,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
public JavaRDD<WriteStatus> compact(String commitTime) throws IOException {
// Create a Hoodie table which encapsulated the commits and files visible
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
JavaRDD<WriteStatus> statuses = table.compact(jsc, commitTime);
// Trigger the insert and collect statuses
statuses = statuses.persist(config.getWriteStatusStorageLevel());
@@ -980,9 +936,6 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
/**
* Commit a compaction operation
* @param commitTime
* @param writeStatuses
* @param extraMetadata
*/
public void commitCompaction(String commitTime, JavaRDD<WriteStatus> writeStatuses,
Optional<HashMap<String, String>> extraMetadata) {
@@ -992,8 +945,6 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
/**
* Commit a compaction operation
* @param commitTime
* @param writeStatuses
*/
public void commitCompaction(String commitTime, JavaRDD<WriteStatus> writeStatuses) {
String commitCompactionActionType = HoodieActiveTimeline.COMMIT_ACTION;
@@ -1006,8 +957,8 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
*/
private void forceCompact(String compactionCommitTime) throws IOException {
// Create a Hoodie table which encapsulated the commits and files visible
HoodieTableMetaClient metaClient =
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(),
config.getBasePath(), true);
HoodieTable<T> table = HoodieTable.getHoodieTable(metaClient, config);
JavaRDD<WriteStatus> compactedStatuses = table.compact(jsc, compactionCommitTime);
if (!compactedStatuses.isEmpty()) {
@@ -1029,8 +980,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
}
private void commitForceCompaction(JavaRDD<WriteStatus> writeStatuses,
HoodieTableMetaClient metaClient,
String compactionCommitTime) {
HoodieTableMetaClient metaClient, String compactionCommitTime) {
List<HoodieWriteStat> updateStatusMap = writeStatuses.map(writeStatus -> writeStatus.getStat())
.collect();
@@ -1054,12 +1004,6 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
}
}
public static SparkConf registerClasses(SparkConf conf) {
conf.registerKryoClasses(
new Class[]{HoodieWriteConfig.class, HoodieRecord.class, HoodieKey.class});
return conf;
}
/**
* Deduplicate Hoodie records, using the given deduplication funciton.
*/
@@ -1074,13 +1018,13 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
return new Tuple2<>(key, record);
})
.reduceByKey((rec1, rec2) -> {
@SuppressWarnings("unchecked")
T reducedData = (T) rec1.getData().preCombine(rec2.getData());
// we cannot allow the user to change the key or partitionPath, since that will affect everything
@SuppressWarnings("unchecked") T reducedData = (T) rec1.getData()
.preCombine(rec2.getData());
// we cannot allow the user to change the key or partitionPath, since that will affect
// everything
// so pick it from one of the records.
return new HoodieRecord<T>(rec1.getKey(), reducedData);
}, parallelism)
.map(recordTuple -> recordTuple._2());
}, parallelism).map(recordTuple -> recordTuple._2());
}
/**
@@ -1088,8 +1032,7 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
*/
private void rollbackInflightCommits() {
HoodieTable<T> table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
HoodieTimeline inflightTimeline = table.getCommitsTimeline().filterInflights();
List<String> commits = inflightTimeline.getInstants().map(HoodieInstant::getTimestamp)
.collect(Collectors.toList());
@@ -1103,7 +1046,6 @@ public class HoodieWriteClient<T extends HoodieRecordPayload> implements Seriali
writeContext = metrics.getCommitCtx();
// Create a Hoodie table which encapsulated the commits and files visible
return HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true),
config);
new HoodieTableMetaClient(jsc.hadoopConfiguration(), config.getBasePath(), true), config);
}
}
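Tying the pieces above together, a hedged end-to-end write sketch: register the Kryo classes, build a config, start a commit, upsert, then commit. Only methods that appear in this diff are used (registerClasses, startCommit, upsert, commit); the base path is a placeholder, the com.uber.hoodie package names are assumptions, and buildRecords is a stub standing in for real record construction.

import java.util.Optional;
import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import com.uber.hoodie.HoodieWriteClient;
import com.uber.hoodie.WriteStatus;
import com.uber.hoodie.common.model.HoodieAvroPayload;
import com.uber.hoodie.common.model.HoodieRecord;
import com.uber.hoodie.config.HoodieIndexConfig;
import com.uber.hoodie.config.HoodieWriteConfig;
import com.uber.hoodie.index.HoodieIndex;

public class WriteClientExample {

  public static void main(String[] args) throws Exception {
    SparkConf sparkConf = HoodieWriteClient.registerClasses(
        new SparkConf().setAppName("hoodie-write-example").setMaster("local[2]"));
    JavaSparkContext jsc = new JavaSparkContext(sparkConf);

    HoodieWriteConfig config = HoodieWriteConfig.newBuilder()
        .withPath("/tmp/hoodie/sample-table")   // placeholder base path
        .withIndexConfig(
            HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build())
        .build();

    HoodieWriteClient<HoodieAvroPayload> client = new HoodieWriteClient<>(jsc, config);
    String commitTime = client.startCommit();                       // new commit on the timeline
    JavaRDD<HoodieRecord<HoodieAvroPayload>> records = buildRecords(jsc);
    JavaRDD<WriteStatus> statuses = client.upsert(records, commitTime);
    client.commit(commitTime, statuses, Optional.empty());          // no extra metadata

    jsc.stop();
  }

  // Stub for illustration only; a real job would build HoodieRecords from its source data.
  private static JavaRDD<HoodieRecord<HoodieAvroPayload>> buildRecords(JavaSparkContext jsc) {
    return jsc.emptyRDD();
  }
}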

View File

@@ -106,14 +106,14 @@ public class WriteStatus implements Serializable {
return globalError != null;
}
public void setGlobalError(Throwable t) {
this.globalError = t;
}
public Throwable getGlobalError() {
return this.globalError;
}
public void setGlobalError(Throwable t) {
this.globalError = t;
}
public List<HoodieRecord> getWrittenRecords() {
return writtenRecords;
}

View File

@@ -30,10 +30,6 @@ public class DefaultHoodieConfig implements Serializable {
this.props = props;
}
public Properties getProps() {
return props;
}
public static void setDefaultOnCondition(Properties props, boolean condition, String propName,
String defaultValue) {
if (condition) {
@@ -48,4 +44,8 @@ public class DefaultHoodieConfig implements Serializable {
}
}
public Properties getProps() {
return props;
}
}
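The setDefaultOnCondition helper above only writes a property when its condition holds, which is how the config builders below layer defaults under user-supplied values. A tiny standalone sketch of that pattern with plain java.util.Properties (the override value is illustrative):

import java.util.Properties;

public class ConfigDefaultsExample {

  static void setDefaultOnCondition(Properties props, boolean condition, String propName, String defaultValue) {
    if (condition) {
      props.setProperty(propName, defaultValue);
    }
  }

  public static void main(String[] args) {
    Properties props = new Properties();
    props.setProperty("hoodie.cleaner.commits.retained", "48");   // user-supplied override
    // Defaults are only filled in when the key is absent, mirroring the builders in this change
    setDefaultOnCondition(props, !props.containsKey("hoodie.cleaner.commits.retained"),
        "hoodie.cleaner.commits.retained", "24");
    setDefaultOnCondition(props, !props.containsKey("hoodie.clean.automatic"),
        "hoodie.clean.automatic", "true");
    System.out.println(props.getProperty("hoodie.cleaner.commits.retained"));   // 48, override kept
    System.out.println(props.getProperty("hoodie.clean.automatic"));            // true, default applied
  }
}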

View File

@@ -34,81 +34,76 @@ import javax.annotation.concurrent.Immutable;
public class HoodieCompactionConfig extends DefaultHoodieConfig {
public static final String CLEANER_POLICY_PROP = "hoodie.cleaner.policy";
private static final String DEFAULT_CLEANER_POLICY =
HoodieCleaningPolicy.KEEP_LATEST_COMMITS.name();
public static final String AUTO_CLEAN_PROP = "hoodie.clean.automatic";
private static final String DEFAULT_AUTO_CLEAN = "true";
// Turn on inline compaction - after fw delta commits a inline compaction will be run
public static final String INLINE_COMPACT_PROP = "hoodie.compact.inline";
private static final String DEFAULT_INLINE_COMPACT = "false";
// Run a compaction every N delta commits
public static final String INLINE_COMPACT_NUM_DELTA_COMMITS_PROP = "hoodie.compact.inline.max.delta.commits";
private static final String DEFAULT_INLINE_COMPACT_NUM_DELTA_COMMITS = "10";
public static final String INLINE_COMPACT_NUM_DELTA_COMMITS_PROP =
"hoodie.compact.inline.max" + ".delta.commits";
public static final String CLEANER_FILE_VERSIONS_RETAINED_PROP =
"hoodie.cleaner.fileversions.retained";
private static final String DEFAULT_CLEANER_FILE_VERSIONS_RETAINED = "3";
"hoodie.cleaner.fileversions" + ".retained";
public static final String CLEANER_COMMITS_RETAINED_PROP = "hoodie.cleaner.commits.retained";
private static final String DEFAULT_CLEANER_COMMITS_RETAINED = "24";
public static final String MAX_COMMITS_TO_KEEP = "hoodie.keep.max.commits";
private static final String DEFAULT_MAX_COMMITS_TO_KEEP = String.valueOf(128);
public static final String MIN_COMMITS_TO_KEEP = "hoodie.keep.min.commits";
private static final String DEFAULT_MIN_COMMITS_TO_KEEP = String.valueOf(96);
// Upsert uses this file size to compact new data onto existing files..
public static final String PARQUET_SMALL_FILE_LIMIT_BYTES = "hoodie.parquet.small.file.limit";
// Turned off by default
public static final String DEFAULT_PARQUET_SMALL_FILE_LIMIT_BYTES = String.valueOf(0);
/**
* Configs related to specific table types
**/
// Number of inserts, that will be put each partition/bucket for writing
public static final String COPY_ON_WRITE_TABLE_INSERT_SPLIT_SIZE = "hoodie.copyonwrite.insert.split.size";
public static final String COPY_ON_WRITE_TABLE_INSERT_SPLIT_SIZE =
"hoodie.copyonwrite.insert" + ".split.size";
// The rationale to pick the insert parallelism is the following. Writing out 100MB files,
// with atleast 1kb records, means 100K records per file. we just overprovision to 500K
public static final String DEFAULT_COPY_ON_WRITE_TABLE_INSERT_SPLIT_SIZE = String.valueOf(500000);
// Config to control whether we control insert split sizes automatically based on average record sizes
public static final String COPY_ON_WRITE_TABLE_AUTO_SPLIT_INSERTS = "hoodie.copyonwrite.insert.auto.split";
// Config to control whether we control insert split sizes automatically based on average
// record sizes
public static final String COPY_ON_WRITE_TABLE_AUTO_SPLIT_INSERTS =
"hoodie.copyonwrite.insert" + ".auto.split";
// its off by default
public static final String DEFAULT_COPY_ON_WRITE_TABLE_AUTO_SPLIT_INSERTS = String.valueOf(false);
// This value is used as a guessimate for the record size, if we can't determine this from previous commits
public static final String COPY_ON_WRITE_TABLE_RECORD_SIZE_ESTIMATE = "hoodie.copyonwrite.record.size.estimate";
// Used to determine how much more can be packed into a small file, before it exceeds the size limit.
// This value is used as a guessimate for the record size, if we can't determine this from
// previous commits
public static final String COPY_ON_WRITE_TABLE_RECORD_SIZE_ESTIMATE =
"hoodie.copyonwrite" + ".record.size.estimate";
// Used to determine how much more can be packed into a small file, before it exceeds the size
// limit.
public static final String DEFAULT_COPY_ON_WRITE_TABLE_RECORD_SIZE_ESTIMATE = String
.valueOf(1024);
public static final String CLEANER_PARALLELISM = "hoodie.cleaner.parallelism";
public static final String DEFAULT_CLEANER_PARALLELISM = String.valueOf(200);
public static final String TARGET_IO_PER_COMPACTION_IN_MB_PROP = "hoodie.compaction.target.io";
// 500GB of target IO per compaction (both read and write)
public static final String DEFAULT_TARGET_IO_PER_COMPACTION_IN_MB = String.valueOf(500 * 1024);
public static final String COMPACTION_STRATEGY_PROP = "hoodie.compaction.strategy";
// 200GB of target IO per compaction
public static final String DEFAULT_COMPACTION_STRATEGY = LogFileSizeBasedCompactionStrategy.class
.getName();
// used to merge records written to log file
public static final String DEFAULT_PAYLOAD_CLASS = HoodieAvroPayload.class.getName();
public static final String PAYLOAD_CLASS_PROP = "hoodie.compaction.payload.class";
// used to choose a trade off between IO vs Memory when performing compaction process
// Depending on outputfile_size and memory provided, choose true to avoid OOM for large file size + small memory
public static final String COMPACTION_LAZY_BLOCK_READ_ENABLED_PROP = "hoodie.compaction.lazy.block.read";
// Depending on outputfile_size and memory provided, choose true to avoid OOM for large file
// size + small memory
public static final String COMPACTION_LAZY_BLOCK_READ_ENABLED_PROP =
"hoodie.compaction.lazy" + ".block.read";
public static final String DEFAULT_COMPACTION_LAZY_BLOCK_READ_ENABLED = "false";
// used to choose whether to enable reverse log reading (reverse log traversal)
public static final String COMPACTION_REVERSE_LOG_READ_ENABLED_PROP = "hoodie.compaction.reverse.log.read";
public static final String COMPACTION_REVERSE_LOG_READ_ENABLED_PROP =
"hoodie.compaction" + ".reverse.log.read";
public static final String DEFAULT_COMPACTION_REVERSE_LOG_READ_ENABLED = "false";
private static final String DEFAULT_CLEANER_POLICY = HoodieCleaningPolicy.KEEP_LATEST_COMMITS
.name();
private static final String DEFAULT_AUTO_CLEAN = "true";
private static final String DEFAULT_INLINE_COMPACT = "false";
private static final String DEFAULT_INLINE_COMPACT_NUM_DELTA_COMMITS = "10";
private static final String DEFAULT_CLEANER_FILE_VERSIONS_RETAINED = "3";
private static final String DEFAULT_CLEANER_COMMITS_RETAINED = "24";
private static final String DEFAULT_MAX_COMMITS_TO_KEEP = String.valueOf(128);
private static final String DEFAULT_MIN_COMMITS_TO_KEEP = String.valueOf(96);
private HoodieCompactionConfig(Properties props) {
super(props);
@@ -159,8 +154,7 @@ public class HoodieCompactionConfig extends DefaultHoodieConfig {
}
public Builder retainFileVersions(int fileVersionsRetained) {
props.setProperty(CLEANER_FILE_VERSIONS_RETAINED_PROP,
String.valueOf(fileVersionsRetained));
props.setProperty(CLEANER_FILE_VERSIONS_RETAINED_PROP, String.valueOf(fileVersionsRetained));
return this;
}
@@ -238,22 +232,22 @@ public class HoodieCompactionConfig extends DefaultHoodieConfig {
public HoodieCompactionConfig build() {
HoodieCompactionConfig config = new HoodieCompactionConfig(props);
setDefaultOnCondition(props, !props.containsKey(AUTO_CLEAN_PROP),
AUTO_CLEAN_PROP, DEFAULT_AUTO_CLEAN);
setDefaultOnCondition(props, !props.containsKey(INLINE_COMPACT_PROP),
INLINE_COMPACT_PROP, DEFAULT_INLINE_COMPACT);
setDefaultOnCondition(props, !props.containsKey(AUTO_CLEAN_PROP), AUTO_CLEAN_PROP,
DEFAULT_AUTO_CLEAN);
setDefaultOnCondition(props, !props.containsKey(INLINE_COMPACT_PROP), INLINE_COMPACT_PROP,
DEFAULT_INLINE_COMPACT);
setDefaultOnCondition(props, !props.containsKey(INLINE_COMPACT_NUM_DELTA_COMMITS_PROP),
INLINE_COMPACT_NUM_DELTA_COMMITS_PROP, DEFAULT_INLINE_COMPACT_NUM_DELTA_COMMITS);
setDefaultOnCondition(props, !props.containsKey(CLEANER_POLICY_PROP),
CLEANER_POLICY_PROP, DEFAULT_CLEANER_POLICY);
setDefaultOnCondition(props, !props.containsKey(CLEANER_POLICY_PROP), CLEANER_POLICY_PROP,
DEFAULT_CLEANER_POLICY);
setDefaultOnCondition(props, !props.containsKey(CLEANER_FILE_VERSIONS_RETAINED_PROP),
CLEANER_FILE_VERSIONS_RETAINED_PROP, DEFAULT_CLEANER_FILE_VERSIONS_RETAINED);
setDefaultOnCondition(props, !props.containsKey(CLEANER_COMMITS_RETAINED_PROP),
CLEANER_COMMITS_RETAINED_PROP, DEFAULT_CLEANER_COMMITS_RETAINED);
setDefaultOnCondition(props, !props.containsKey(MAX_COMMITS_TO_KEEP),
MAX_COMMITS_TO_KEEP, DEFAULT_MAX_COMMITS_TO_KEEP);
setDefaultOnCondition(props, !props.containsKey(MIN_COMMITS_TO_KEEP),
MIN_COMMITS_TO_KEEP, DEFAULT_MIN_COMMITS_TO_KEEP);
setDefaultOnCondition(props, !props.containsKey(MAX_COMMITS_TO_KEEP), MAX_COMMITS_TO_KEEP,
DEFAULT_MAX_COMMITS_TO_KEEP);
setDefaultOnCondition(props, !props.containsKey(MIN_COMMITS_TO_KEEP), MIN_COMMITS_TO_KEEP,
DEFAULT_MIN_COMMITS_TO_KEEP);
setDefaultOnCondition(props, !props.containsKey(PARQUET_SMALL_FILE_LIMIT_BYTES),
PARQUET_SMALL_FILE_LIMIT_BYTES, DEFAULT_PARQUET_SMALL_FILE_LIMIT_BYTES);
setDefaultOnCondition(props, !props.containsKey(COPY_ON_WRITE_TABLE_INSERT_SPLIT_SIZE),
@@ -263,8 +257,8 @@ public class HoodieCompactionConfig extends DefaultHoodieConfig {
setDefaultOnCondition(props, !props.containsKey(COPY_ON_WRITE_TABLE_RECORD_SIZE_ESTIMATE),
COPY_ON_WRITE_TABLE_RECORD_SIZE_ESTIMATE,
DEFAULT_COPY_ON_WRITE_TABLE_RECORD_SIZE_ESTIMATE);
setDefaultOnCondition(props, !props.containsKey(CLEANER_PARALLELISM),
CLEANER_PARALLELISM, DEFAULT_CLEANER_PARALLELISM);
setDefaultOnCondition(props, !props.containsKey(CLEANER_PARALLELISM), CLEANER_PARALLELISM,
DEFAULT_CLEANER_PARALLELISM);
setDefaultOnCondition(props, !props.containsKey(COMPACTION_STRATEGY_PROP),
COMPACTION_STRATEGY_PROP, DEFAULT_COMPACTION_STRATEGY);
setDefaultOnCondition(props, !props.containsKey(PAYLOAD_CLASS_PROP),
@@ -277,8 +271,7 @@ public class HoodieCompactionConfig extends DefaultHoodieConfig {
COMPACTION_REVERSE_LOG_READ_ENABLED_PROP, DEFAULT_COMPACTION_REVERSE_LOG_READ_ENABLED);
HoodieCleaningPolicy.valueOf(props.getProperty(CLEANER_POLICY_PROP));
Preconditions.checkArgument(
Integer.parseInt(props.getProperty(MAX_COMMITS_TO_KEEP)) > Integer
Preconditions.checkArgument(Integer.parseInt(props.getProperty(MAX_COMMITS_TO_KEEP)) > Integer
.parseInt(props.getProperty(MIN_COMMITS_TO_KEEP)));
return config;
}
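
Every build() in these config classes funnels defaults through the same setDefaultOnCondition helper. Its implementation is not part of this diff, so the snippet below is only a sketch of the behaviour the call sites imply (apply the default only when the user has not set the key); the property names and defaults used here are the ones declared above.

import java.util.Properties;

public class SetDefaultOnConditionSketch {

  // Sketch: set 'key' to 'defaultValue' only when the condition holds (here: the key is absent).
  static void setDefaultOnCondition(Properties props, boolean condition, String key, String defaultValue) {
    if (condition) {
      props.setProperty(key, defaultValue);
    }
  }

  public static void main(String[] args) {
    Properties props = new Properties();
    props.setProperty("hoodie.cleaner.parallelism", "50"); // user-supplied value, must survive
    setDefaultOnCondition(props, !props.containsKey("hoodie.cleaner.parallelism"),
        "hoodie.cleaner.parallelism", "200");                       // DEFAULT_CLEANER_PARALLELISM
    setDefaultOnCondition(props, !props.containsKey("hoodie.compaction.target.io"),
        "hoodie.compaction.target.io", String.valueOf(500 * 1024)); // 500GB default, in MB
    // cleaner parallelism stays 50; target IO picks up the 512000 MB default
    System.out.println(props);
  }
}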

View File

@@ -40,23 +40,25 @@ public class HoodieIndexConfig extends DefaultHoodieConfig {
public static final String BLOOM_INDEX_PARALLELISM_PROP = "hoodie.bloom.index.parallelism";
// Disable explicit bloom index parallelism setting by default - hoodie auto computes
public static final String DEFAULT_BLOOM_INDEX_PARALLELISM = "0";
public static final String BLOOM_INDEX_PRUNE_BY_RANGES_PROP = "hoodie.bloom.index.prune.by.ranges";
public static final String BLOOM_INDEX_PRUNE_BY_RANGES_PROP =
"hoodie.bloom.index.prune.by" + ".ranges";
public static final String DEFAULT_BLOOM_INDEX_PRUNE_BY_RANGES = "true";
public static final String BLOOM_INDEX_USE_CACHING_PROP = "hoodie.bloom.index.use.caching";
public static final String DEFAULT_BLOOM_INDEX_USE_CACHING = "true";
public static final String BLOOM_INDEX_INPUT_STORAGE_LEVEL = "hoodie.bloom.index.input.storage.level";
public static final String BLOOM_INDEX_INPUT_STORAGE_LEVEL =
"hoodie.bloom.index.input.storage" + ".level";
public static final String DEFAULT_BLOOM_INDEX_INPUT_STORAGE_LEVEL = "MEMORY_AND_DISK_SER";
// ***** HBase Index Configs *****
public final static String HBASE_ZKQUORUM_PROP = "hoodie.index.hbase.zkquorum";
public final static String HBASE_ZKPORT_PROP = "hoodie.index.hbase.zkport";
public final static String HBASE_TABLENAME_PROP = "hoodie.index.hbase.table";
public final static String HBASE_GET_BATCH_SIZE_PROP = "hoodie.index.hbase.get.batch.size";
public final static String HBASE_PUT_BATCH_SIZE_PROP = "hoodie.index.hbase.put.batch.size";
public final static String DEFAULT_HBASE_BATCH_SIZE = "100";
public static final String HBASE_ZKQUORUM_PROP = "hoodie.index.hbase.zkquorum";
public static final String HBASE_ZKPORT_PROP = "hoodie.index.hbase.zkport";
public static final String HBASE_TABLENAME_PROP = "hoodie.index.hbase.table";
public static final String HBASE_GET_BATCH_SIZE_PROP = "hoodie.index.hbase.get.batch.size";
public static final String HBASE_PUT_BATCH_SIZE_PROP = "hoodie.index.hbase.put.batch.size";
public static final String DEFAULT_HBASE_BATCH_SIZE = "100";
// ***** Bucketed Index Configs *****
public final static String BUCKETED_INDEX_NUM_BUCKETS_PROP = "hoodie.index.bucketed.numbuckets";
public static final String BUCKETED_INDEX_NUM_BUCKETS_PROP = "hoodie.index.bucketed.numbuckets";
private HoodieIndexConfig(Properties props) {
super(props);
@@ -152,12 +154,12 @@ public class HoodieIndexConfig extends DefaultHoodieConfig {
public HoodieIndexConfig build() {
HoodieIndexConfig config = new HoodieIndexConfig(props);
setDefaultOnCondition(props, !props.containsKey(INDEX_TYPE_PROP),
INDEX_TYPE_PROP, DEFAULT_INDEX_TYPE);
setDefaultOnCondition(props, !props.containsKey(INDEX_TYPE_PROP), INDEX_TYPE_PROP,
DEFAULT_INDEX_TYPE);
setDefaultOnCondition(props, !props.containsKey(BLOOM_FILTER_NUM_ENTRIES),
BLOOM_FILTER_NUM_ENTRIES, DEFAULT_BLOOM_FILTER_NUM_ENTRIES);
setDefaultOnCondition(props, !props.containsKey(BLOOM_FILTER_FPP),
BLOOM_FILTER_FPP, DEFAULT_BLOOM_FILTER_FPP);
setDefaultOnCondition(props, !props.containsKey(BLOOM_FILTER_FPP), BLOOM_FILTER_FPP,
DEFAULT_BLOOM_FILTER_FPP);
setDefaultOnCondition(props, !props.containsKey(BLOOM_INDEX_PARALLELISM_PROP),
BLOOM_INDEX_PARALLELISM_PROP, DEFAULT_BLOOM_INDEX_PARALLELISM);
setDefaultOnCondition(props, !props.containsKey(BLOOM_INDEX_PRUNE_BY_RANGES_PROP),

View File

@@ -30,8 +30,8 @@ import org.apache.spark.util.Utils;
@Immutable
public class HoodieMemoryConfig extends DefaultHoodieConfig {
// This fraction is multiplied with the spark.memory.fraction to get a final fraction of heap space to use during merge
// This makes it easier to scale this value as one increases the spark.executor.memory
// This fraction is multiplied with the spark.memory.fraction to get a final fraction of heap space to use
// during merge. This makes it easier to scale this value as one increases the spark.executor.memory
public static final String MAX_MEMORY_FRACTION_FOR_MERGE_PROP = "hoodie.memory.merge.fraction";
// Default max memory fraction during hash-merge, excess spills to disk
public static final String DEFAULT_MAX_MEMORY_FRACTION_FOR_MERGE = String.valueOf(0.6);
@@ -87,19 +87,21 @@ public class HoodieMemoryConfig extends DefaultHoodieConfig {
}
/**
* Dynamic calculation of max memory to use for spillable map. user.available.memory =
* spark.executor.memory * (1 - spark.memory.fraction) spillable.available.memory =
* user.available.memory * hoodie.memory.fraction. Anytime the spark.executor.memory or the
* spark.memory.fraction is changed, the memory used for spillable map changes accordingly
* Dynamic calculation of max memory to use for spillable map. user.available.memory = spark.executor.memory *
* (1 - spark.memory.fraction) spillable.available.memory = user.available.memory * hoodie.memory.fraction. Anytime
* the spark.executor.memory or the spark.memory.fraction is changed, the memory used for spillable map changes
* accordingly
*/
private long getMaxMemoryAllowedForMerge(String maxMemoryFraction) {
final String SPARK_EXECUTOR_MEMORY_PROP = "spark.executor.memory";
final String SPARK_EXECUTOR_MEMORY_FRACTION_PROP = "spark.memory.fraction";
// This is hard-coded in spark code {@link https://github.com/apache/spark/blob/576c43fb4226e4efa12189b41c3bc862019862c6/core/src/main/scala/org/apache/spark/memory/UnifiedMemoryManager.scala#L231}
// so have to re-define this here
// This is hard-coded in spark code {@link
// https://github.com/apache/spark/blob/576c43fb4226e4efa12189b41c3bc862019862c6/core/src/main/scala/org/apache/
// spark/memory/UnifiedMemoryManager.scala#L231} so have to re-define this here
final String DEFAULT_SPARK_EXECUTOR_MEMORY_FRACTION = "0.6";
// This is hard-coded in spark code {@link https://github.com/apache/spark/blob/576c43fb4226e4efa12189b41c3bc862019862c6/core/src/main/scala/org/apache/spark/SparkContext.scala#L471}
// so have to re-define this here
// This is hard-coded in spark code {@link
// https://github.com/apache/spark/blob/576c43fb4226e4efa12189b41c3bc862019862c6/core/src/main/scala/org/apache/
// spark/SparkContext.scala#L471} so have to re-define this here
final String DEFAULT_SPARK_EXECUTOR_MEMORY_MB = "1024"; // in MB
if (SparkEnv.get() != null) {
@@ -109,7 +111,8 @@ public class HoodieMemoryConfig extends DefaultHoodieConfig {
DEFAULT_SPARK_EXECUTOR_MEMORY_MB)) * 1024
* 1024L);
// 0.6 is the default value used by Spark,
// look at {@link https://github.com/apache/spark/blob/master/core/src/main/scala/org/apache/spark/SparkConf.scala#L507}
// look at {@link
// https://github.com/apache/spark/blob/master/core/src/main/scala/org/apache/spark/SparkConf.scala#L507}
double memoryFraction = Double
.valueOf(SparkEnv.get().conf().get(SPARK_EXECUTOR_MEMORY_FRACTION_PROP,
DEFAULT_SPARK_EXECUTOR_MEMORY_FRACTION));
@@ -143,5 +146,4 @@ public class HoodieMemoryConfig extends DefaultHoodieConfig {
return config;
}
}
}
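
The javadoc above boils down to two multiplications. A back-of-the-envelope sketch, assuming a 4 GB executor and the 0.6 defaults visible in this diff (the real method reads both values from SparkEnv at runtime):

public class MergeMemorySketch {
  public static void main(String[] args) {
    long executorMemoryBytes = 4L * 1024 * 1024 * 1024; // assumed spark.executor.memory of 4 GB
    double sparkMemoryFraction = 0.6;                   // spark.memory.fraction default
    double hoodieMergeFraction = 0.6;                   // hoodie.memory.merge.fraction default

    // user.available.memory = spark.executor.memory * (1 - spark.memory.fraction)
    long userAvailable = (long) (executorMemoryBytes * (1 - sparkMemoryFraction));
    // spillable.available.memory = user.available.memory * hoodie.memory.fraction
    long spillableMapBudget = (long) (userAvailable * hoodieMergeFraction);

    System.out.println(userAvailable);      // ~1.6 GB left for user code
    System.out.println(spillableMapBudget); // ~0.96 GB budget for the spillable map during merge
  }
}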

View File

@@ -29,22 +29,22 @@ import javax.annotation.concurrent.Immutable;
@Immutable
public class HoodieMetricsConfig extends DefaultHoodieConfig {
public final static String METRIC_PREFIX = "hoodie.metrics";
public final static String METRICS_ON = METRIC_PREFIX + ".on";
public final static boolean DEFAULT_METRICS_ON = false;
public final static String METRICS_REPORTER_TYPE = METRIC_PREFIX + ".reporter.type";
public final static MetricsReporterType DEFAULT_METRICS_REPORTER_TYPE =
MetricsReporterType.GRAPHITE;
public static final String METRIC_PREFIX = "hoodie.metrics";
public static final String METRICS_ON = METRIC_PREFIX + ".on";
public static final boolean DEFAULT_METRICS_ON = false;
public static final String METRICS_REPORTER_TYPE = METRIC_PREFIX + ".reporter.type";
public static final MetricsReporterType DEFAULT_METRICS_REPORTER_TYPE = MetricsReporterType
.GRAPHITE;
// Graphite
public final static String GRAPHITE_PREFIX = METRIC_PREFIX + ".graphite";
public final static String GRAPHITE_SERVER_HOST = GRAPHITE_PREFIX + ".host";
public final static String DEFAULT_GRAPHITE_SERVER_HOST = "localhost";
public static final String GRAPHITE_PREFIX = METRIC_PREFIX + ".graphite";
public static final String GRAPHITE_SERVER_HOST = GRAPHITE_PREFIX + ".host";
public static final String DEFAULT_GRAPHITE_SERVER_HOST = "localhost";
public final static String GRAPHITE_SERVER_PORT = GRAPHITE_PREFIX + ".port";
public final static int DEFAULT_GRAPHITE_SERVER_PORT = 4756;
public static final String GRAPHITE_SERVER_PORT = GRAPHITE_PREFIX + ".port";
public static final int DEFAULT_GRAPHITE_SERVER_PORT = 4756;
public final static String GRAPHITE_METRIC_PREFIX = GRAPHITE_PREFIX + ".metric.prefix";
public static final String GRAPHITE_METRIC_PREFIX = GRAPHITE_PREFIX + ".metric.prefix";
private HoodieMetricsConfig(Properties props) {
super(props);
@@ -103,14 +103,14 @@ public class HoodieMetricsConfig extends DefaultHoodieConfig {
HoodieMetricsConfig config = new HoodieMetricsConfig(props);
setDefaultOnCondition(props, !props.containsKey(METRICS_ON), METRICS_ON,
String.valueOf(DEFAULT_METRICS_ON));
setDefaultOnCondition(props, !props.containsKey(METRICS_REPORTER_TYPE),
METRICS_REPORTER_TYPE, DEFAULT_METRICS_REPORTER_TYPE.name());
setDefaultOnCondition(props, !props.containsKey(GRAPHITE_SERVER_HOST),
GRAPHITE_SERVER_HOST, DEFAULT_GRAPHITE_SERVER_HOST);
setDefaultOnCondition(props, !props.containsKey(GRAPHITE_SERVER_PORT),
GRAPHITE_SERVER_PORT, String.valueOf(DEFAULT_GRAPHITE_SERVER_PORT));
setDefaultOnCondition(props, !props.containsKey(GRAPHITE_SERVER_PORT),
GRAPHITE_SERVER_PORT, String.valueOf(DEFAULT_GRAPHITE_SERVER_PORT));
setDefaultOnCondition(props, !props.containsKey(METRICS_REPORTER_TYPE), METRICS_REPORTER_TYPE,
DEFAULT_METRICS_REPORTER_TYPE.name());
setDefaultOnCondition(props, !props.containsKey(GRAPHITE_SERVER_HOST), GRAPHITE_SERVER_HOST,
DEFAULT_GRAPHITE_SERVER_HOST);
setDefaultOnCondition(props, !props.containsKey(GRAPHITE_SERVER_PORT), GRAPHITE_SERVER_PORT,
String.valueOf(DEFAULT_GRAPHITE_SERVER_PORT));
setDefaultOnCondition(props, !props.containsKey(GRAPHITE_SERVER_PORT), GRAPHITE_SERVER_PORT,
String.valueOf(DEFAULT_GRAPHITE_SERVER_PORT));
return config;
}
}
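
For reference, this is what the composed keys above look like once flattened into properties; the host and metric prefix values are placeholders, not defaults from this diff.

import java.util.Properties;

public class MetricsPropsSketch {
  public static void main(String[] args) {
    Properties props = new Properties();
    props.setProperty("hoodie.metrics.on", "true");                            // METRICS_ON (default false)
    props.setProperty("hoodie.metrics.reporter.type", "GRAPHITE");             // METRICS_REPORTER_TYPE default
    props.setProperty("hoodie.metrics.graphite.host", "graphite.internal");    // placeholder host
    props.setProperty("hoodie.metrics.graphite.port", "4756");                 // DEFAULT_GRAPHITE_SERVER_PORT
    props.setProperty("hoodie.metrics.graphite.metric.prefix", "prod.hoodie"); // placeholder prefix
    System.out.println(props);
  }
}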

View File

@@ -36,7 +36,8 @@ public class HoodieStorageConfig extends DefaultHoodieConfig {
public static final String DEFAULT_PARQUET_PAGE_SIZE_BYTES = String.valueOf(1 * 1024 * 1024);
// used to size log files
public static final String LOGFILE_SIZE_MAX_BYTES = "hoodie.logfile.max.size";
public static final String DEFAULT_LOGFILE_SIZE_MAX_BYTES = String.valueOf(1024*1024*1024); // 1 GB
public static final String DEFAULT_LOGFILE_SIZE_MAX_BYTES = String
.valueOf(1024 * 1024 * 1024); // 1 GB
// used to size data blocks in log file
public static final String LOGFILE_DATA_BLOCK_SIZE_MAX_BYTES = "hoodie.logfile.data.block.max.size";
public static final String DEFAULT_LOGFILE_DATA_BLOCK_SIZE_MAX_BYTES = String.valueOf(256 * 1024 * 1024); // 256 MB

View File

@@ -16,7 +16,6 @@
package com.uber.hoodie.config;
import com.google.common.base.Preconditions;
import com.uber.hoodie.WriteStatus;
import com.uber.hoodie.common.model.HoodieCleaningPolicy;
@@ -24,15 +23,14 @@ import com.uber.hoodie.common.util.ReflectionUtils;
import com.uber.hoodie.index.HoodieIndex;
import com.uber.hoodie.io.compact.strategy.CompactionStrategy;
import com.uber.hoodie.metrics.MetricsReporterType;
import org.apache.spark.storage.StorageLevel;
import javax.annotation.concurrent.Immutable;
import java.io.File;
import java.io.FileReader;
import java.io.IOException;
import java.io.InputStream;
import java.util.Map;
import java.util.Properties;
import javax.annotation.concurrent.Immutable;
import org.apache.spark.storage.StorageLevel;
/**
* Class storing configs for the {@link com.uber.hoodie.HoodieWriteClient}
@@ -40,9 +38,9 @@ import java.util.Properties;
@Immutable
public class HoodieWriteConfig extends DefaultHoodieConfig {
public static final String TABLE_NAME = "hoodie.table.name";
private static final String BASE_PATH_PROP = "hoodie.base.path";
private static final String AVRO_SCHEMA = "hoodie.avro.schema";
public static final String TABLE_NAME = "hoodie.table.name";
private static final String DEFAULT_PARALLELISM = "200";
private static final String INSERT_PARALLELISM = "hoodie.insert.shuffle.parallelism";
private static final String BULKINSERT_PARALLELISM = "hoodie.bulkinsert.shuffle.parallelism";
@@ -57,13 +55,16 @@ public class HoodieWriteConfig extends DefaultHoodieConfig {
private static final String DEFAULT_WRITE_STATUS_STORAGE_LEVEL = "MEMORY_AND_DISK_SER";
private static final String HOODIE_AUTO_COMMIT_PROP = "hoodie.auto.commit";
private static final String DEFAULT_HOODIE_AUTO_COMMIT = "true";
private static final String HOODIE_ASSUME_DATE_PARTITIONING_PROP = "hoodie.assume.date.partitioning";
private static final String HOODIE_ASSUME_DATE_PARTITIONING_PROP =
"hoodie.assume.date" + ".partitioning";
private static final String DEFAULT_ASSUME_DATE_PARTITIONING = "false";
private static final String HOODIE_WRITE_STATUS_CLASS_PROP = "hoodie.writestatus.class";
private static final String DEFAULT_HOODIE_WRITE_STATUS_CLASS = WriteStatus.class.getName();
private static final String HOODIE_COPYONWRITE_USE_TEMP_FOLDER_CREATE = "hoodie.copyonwrite.use.temp.folder.for.create";
private static final String HOODIE_COPYONWRITE_USE_TEMP_FOLDER_CREATE =
"hoodie.copyonwrite.use" + ".temp.folder.for.create";
private static final String DEFAULT_HOODIE_COPYONWRITE_USE_TEMP_FOLDER_CREATE = "false";
private static final String HOODIE_COPYONWRITE_USE_TEMP_FOLDER_MERGE = "hoodie.copyonwrite.use.temp.folder.for.merge";
private static final String HOODIE_COPYONWRITE_USE_TEMP_FOLDER_MERGE =
"hoodie.copyonwrite.use" + ".temp.folder.for.merge";
private static final String DEFAULT_HOODIE_COPYONWRITE_USE_TEMP_FOLDER_MERGE = "false";
private static final String FINALIZE_WRITE_PARALLELISM = "hoodie.finalize.write.parallelism";
private static final String DEFAULT_FINALIZE_WRITE_PARALLELISM = DEFAULT_PARALLELISM;
@@ -72,6 +73,10 @@ public class HoodieWriteConfig extends DefaultHoodieConfig {
super(props);
}
public static HoodieWriteConfig.Builder newBuilder() {
return new Builder();
}
/**
* base properties
**/
@@ -137,8 +142,8 @@ public class HoodieWriteConfig extends DefaultHoodieConfig {
}
public boolean shouldUseTempFolderForCopyOnWrite() {
return shouldUseTempFolderForCopyOnWriteForCreate() ||
shouldUseTempFolderForCopyOnWriteForMerge();
return shouldUseTempFolderForCopyOnWriteForCreate()
|| shouldUseTempFolderForCopyOnWriteForMerge();
}
public int getFinalizeWriteParallelism() {
@@ -154,8 +159,8 @@ public class HoodieWriteConfig extends DefaultHoodieConfig {
}
public int getCleanerFileVersionsRetained() {
return Integer.parseInt(
props.getProperty(HoodieCompactionConfig.CLEANER_FILE_VERSIONS_RETAINED_PROP));
return Integer
.parseInt(props.getProperty(HoodieCompactionConfig.CLEANER_FILE_VERSIONS_RETAINED_PROP));
}
public int getCleanerCommitsRetained() {
@@ -177,8 +182,8 @@ public class HoodieWriteConfig extends DefaultHoodieConfig {
}
public int getCopyOnWriteInsertSplitSize() {
return Integer.parseInt(
props.getProperty(HoodieCompactionConfig.COPY_ON_WRITE_TABLE_INSERT_SPLIT_SIZE));
return Integer
.parseInt(props.getProperty(HoodieCompactionConfig.COPY_ON_WRITE_TABLE_INSERT_SPLIT_SIZE));
}
public int getCopyOnWriteRecordSizeEstimate() {
@@ -204,8 +209,8 @@ public class HoodieWriteConfig extends DefaultHoodieConfig {
}
public int getInlineCompactDeltaCommitMax() {
return Integer.parseInt(
props.getProperty(HoodieCompactionConfig.INLINE_COMPACT_NUM_DELTA_COMMITS_PROP));
return Integer
.parseInt(props.getProperty(HoodieCompactionConfig.INLINE_COMPACT_NUM_DELTA_COMMITS_PROP));
}
public CompactionStrategy getCompactionStrategy() {
@@ -341,10 +346,6 @@ public class HoodieWriteConfig extends DefaultHoodieConfig {
return props.getProperty(HoodieMetricsConfig.GRAPHITE_METRIC_PREFIX);
}
public static HoodieWriteConfig.Builder newBuilder() {
return new Builder();
}
/**
* memory configs
*/
@@ -486,15 +487,15 @@ public class HoodieWriteConfig extends DefaultHoodieConfig {
public Builder withUseTempFolderCopyOnWriteForCreate(
boolean shouldUseTempFolderCopyOnWriteForCreate) {
props.setProperty(HOODIE_COPYONWRITE_USE_TEMP_FOLDER_CREATE, String.valueOf
(shouldUseTempFolderCopyOnWriteForCreate));
props.setProperty(HOODIE_COPYONWRITE_USE_TEMP_FOLDER_CREATE,
String.valueOf(shouldUseTempFolderCopyOnWriteForCreate));
return this;
}
public Builder withUseTempFolderCopyOnWriteForMerge(
boolean shouldUseTempFolderCopyOnWriteForMerge) {
props.setProperty(HOODIE_COPYONWRITE_USE_TEMP_FOLDER_MERGE, String.valueOf
(shouldUseTempFolderCopyOnWriteForMerge));
props.setProperty(HOODIE_COPYONWRITE_USE_TEMP_FOLDER_MERGE,
String.valueOf(shouldUseTempFolderCopyOnWriteForMerge));
return this;
}
@@ -510,8 +511,7 @@ public class HoodieWriteConfig extends DefaultHoodieConfig {
setDefaultOnCondition(props, !props.containsKey(INSERT_PARALLELISM), INSERT_PARALLELISM,
DEFAULT_PARALLELISM);
setDefaultOnCondition(props, !props.containsKey(BULKINSERT_PARALLELISM),
BULKINSERT_PARALLELISM,
DEFAULT_PARALLELISM);
BULKINSERT_PARALLELISM, DEFAULT_PARALLELISM);
setDefaultOnCondition(props, !props.containsKey(UPSERT_PARALLELISM), UPSERT_PARALLELISM,
DEFAULT_PARALLELISM);
setDefaultOnCondition(props, !props.containsKey(COMBINE_BEFORE_INSERT_PROP),

View File

@@ -21,12 +21,6 @@ import com.google.common.base.Preconditions;
import com.uber.hoodie.common.model.HoodieRecord;
import com.uber.hoodie.common.model.HoodieRecordPayload;
import com.uber.hoodie.exception.HoodieException;
import org.apache.avro.Schema;
import org.apache.avro.generic.IndexedRecord;
import org.apache.log4j.LogManager;
import org.apache.log4j.Logger;
import org.apache.spark.util.SizeEstimator;
import java.util.Iterator;
import java.util.Optional;
import java.util.concurrent.LinkedBlockingQueue;
@@ -35,53 +29,63 @@ import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicBoolean;
import java.util.concurrent.atomic.AtomicLong;
import java.util.concurrent.atomic.AtomicReference;
import org.apache.avro.Schema;
import org.apache.avro.generic.IndexedRecord;
import org.apache.log4j.LogManager;
import org.apache.log4j.Logger;
import org.apache.spark.util.SizeEstimator;
/**
* Used for buffering input records. Buffer limit is controlled by {@link #bufferMemoryLimit}. It internally samples
* every {@link #RECORD_SAMPLING_RATE}th record and adjusts number of records in buffer accordingly. This is done to
* ensure that we don't OOM.
* Used for buffering input records. Buffer limit is controlled by {@link #bufferMemoryLimit}. It
* internally samples every {@link #RECORD_SAMPLING_RATE}th record and adjusts number of records in
* buffer accordingly. This is done to ensure that we don't OOM.
*/
public class BufferedIterator<K extends HoodieRecordPayload, T extends HoodieRecord<K>>
implements Iterator<BufferedIterator.BufferedIteratorPayload<T>> {
public class BufferedIterator<K extends HoodieRecordPayload, T extends HoodieRecord<K>> implements
Iterator<BufferedIterator.BufferedIteratorPayload<T>> {
private static Logger logger = LogManager.getLogger(BufferedIterator.class);
// interval used for polling records in the queue.
public static final int RECORD_POLL_INTERVAL_SEC = 5;
// rate used for sampling records to determine avg record size in bytes.
public static final int RECORD_SAMPLING_RATE = 64;
// maximum records that will be cached
private static final int RECORD_CACHING_LIMIT = 128 * 1024;
// It indicates number of records to cache. We will be using sampled record's average size to determine how many
private static Logger logger = LogManager.getLogger(BufferedIterator.class);
// It indicates number of records to cache. We will be using sampled record's average size to
// determine how many
// records we should cache and will change (increase/decrease) permits accordingly.
@VisibleForTesting
public final Semaphore rateLimiter = new Semaphore(1);
// used for sampling records with "RECORD_SAMPLING_RATE" frequency.
public final AtomicLong samplingRecordCounter = new AtomicLong(-1);
// indicates rate limit (number of records to cache). it is updated whenever there is a change in avg record size.
@VisibleForTesting
public int currentRateLimit = 1;
// internal buffer to cache buffered records.
private final LinkedBlockingQueue<Optional<BufferedIteratorPayload<T>>> buffer = new LinkedBlockingQueue<>();
private final LinkedBlockingQueue<Optional<BufferedIteratorPayload<T>>> buffer = new
LinkedBlockingQueue<>();
// maximum amount of memory to be used for buffering records.
private final long bufferMemoryLimit;
// original iterator from where records are read for buffering.
private final Iterator<T> inputIterator;
// it holds the root cause of the exception in case either buffering records (reading from
// inputIterator) fails or
// thread reading records from buffer fails.
private final AtomicReference<Exception> hasFailed = new AtomicReference(null);
// used for indicating that all the records from buffer are read successfully.
private final AtomicBoolean isDone = new AtomicBoolean(false);
// schema used for fetching insertValue from HoodieRecord.
private final Schema schema;
// indicates rate limit (number of records to cache). it is updated whenever there is a change
// in avg record size.
@VisibleForTesting
public int currentRateLimit = 1;
// indicates avg record size in bytes. It is updated whenever a new record is sampled.
@VisibleForTesting
public long avgRecordSizeInBytes = 0;
// indicates number of samples collected so far.
private long numSamples = 0;
// original iterator from where records are read for buffering.
private final Iterator<T> inputIterator;
// it holds the root cause of the exception in case either buffering records (reading from inputIterator) fails or
// thread reading records from buffer fails.
private final AtomicReference<Exception> hasFailed = new AtomicReference(null);
// used for indicating that all the records from buffer are read successfully.
private final AtomicBoolean isDone = new AtomicBoolean(false);
// next record to be read from buffer.
private BufferedIteratorPayload<T> nextRecord;
// schema used for fetching insertValue from HoodieRecord.
private final Schema schema;
public BufferedIterator(final Iterator<T> iterator, final long bufferMemoryLimit, final Schema schema) {
public BufferedIterator(final Iterator<T> iterator, final long bufferMemoryLimit,
final Schema schema) {
this.inputIterator = iterator;
this.bufferMemoryLimit = bufferMemoryLimit;
this.schema = schema;
@@ -92,23 +96,28 @@ public class BufferedIterator<K extends HoodieRecordPayload, T extends HoodieRec
return this.buffer.size();
}
// It samples records with "RECORD_SAMPLING_RATE" frequency and computes average record size in bytes. It is used
// for determining how many maximum records to buffer. Based on change in avg size it may increase or decrease
// It samples records with "RECORD_SAMPLING_RATE" frequency and computes average record size in
// bytes. It is used
// for determining how many maximum records to buffer. Based on change in avg size it may
// increase or decrease
// available permits.
private void adjustBufferSizeIfNeeded(final T record) throws InterruptedException {
if (this.samplingRecordCounter.incrementAndGet() % RECORD_SAMPLING_RATE != 0) {
return;
}
final long recordSizeInBytes = SizeEstimator.estimate(record);
final long newAvgRecordSizeInBytes =
Math.max(1, (avgRecordSizeInBytes * numSamples + recordSizeInBytes) / (numSamples + 1));
final int newRateLimit =
(int) Math.min(RECORD_CACHING_LIMIT, Math.max(1, this.bufferMemoryLimit / newAvgRecordSizeInBytes));
// System.out.println("recordSizeInBytes:" + recordSizeInBytes + ":newAvgRecordSizeInBytes:" + newAvgRecordSizeInBytes
// + ":newRateLimit:" + newRateLimit + ":currentRateLimit:" + currentRateLimit + ":numSamples:" + numSamples
final long newAvgRecordSizeInBytes = Math
.max(1, (avgRecordSizeInBytes * numSamples + recordSizeInBytes) / (numSamples + 1));
final int newRateLimit = (int) Math
.min(RECORD_CACHING_LIMIT, Math.max(1, this.bufferMemoryLimit / newAvgRecordSizeInBytes));
// System.out.println("recordSizeInBytes:" + recordSizeInBytes + ":newAvgRecordSizeInBytes:" +
// newAvgRecordSizeInBytes
// + ":newRateLimit:" + newRateLimit + ":currentRateLimit:" + currentRateLimit +
// ":numSamples:" + numSamples
// + ":avgRecordSizeInBytes:" + avgRecordSizeInBytes);
// If there is any change in number of records to cache then we will either release (if it increased) or acquire
// If there is any change in number of records to cache then we will either release (if it
// increased) or acquire
// (if it decreased) to adjust rate limiting to newly computed value.
if (newRateLimit > currentRateLimit) {
rateLimiter.release(newRateLimit - currentRateLimit);
@@ -120,12 +129,14 @@ public class BufferedIterator<K extends HoodieRecordPayload, T extends HoodieRec
numSamples++;
}
// inserts record into internal buffer. It also fetches insert value from the record to offload computation work on to
// inserts record into internal buffer. It also fetches insert value from the record to offload
// computation work on to
// buffering thread.
private void insertRecord(T t) throws Exception {
rateLimiter.acquire();
adjustBufferSizeIfNeeded(t);
// We are retrieving insert value in the record buffering thread to offload computation around schema validation
// We are retrieving insert value in the record buffering thread to offload computation
// around schema validation
// and record creation to it.
final BufferedIteratorPayload<T> payload = new BufferedIteratorPayload<>(t, this.schema);
buffer.put(Optional.of(payload));
@@ -198,12 +209,15 @@ public class BufferedIterator<K extends HoodieRecordPayload, T extends HoodieRec
public void markAsFailed(Exception e) {
this.hasFailed.set(e);
// release the permits so that if the buffering thread is waiting for permits then it will get it.
// release the permits so that if the buffering thread is waiting for permits then it will
// get it.
this.rateLimiter.release(RECORD_CACHING_LIMIT + 1);
}
// Used for caching HoodieRecord along with insertValue. We need this to offload computation work to buffering thread.
// Used for caching HoodieRecord along with insertValue. We need this to offload computation
// work to buffering thread.
static class BufferedIteratorPayload<T extends HoodieRecord> {
public T record;
public Optional<IndexedRecord> insertValue;
// It caches the exception seen while fetching insert value.

View File

@@ -29,8 +29,8 @@ import org.apache.spark.api.java.function.Function2;
/**
* Map function that handles a sorted stream of HoodieRecords
*/
public class BulkInsertMapFunction<T extends HoodieRecordPayload>
implements Function2<Integer, Iterator<HoodieRecord<T>>, Iterator<List<WriteStatus>>> {
public class BulkInsertMapFunction<T extends HoodieRecordPayload> implements
Function2<Integer, Iterator<HoodieRecord<T>>, Iterator<List<WriteStatus>>> {
private String commitTime;
private HoodieWriteConfig config;
@@ -45,8 +45,7 @@ public class BulkInsertMapFunction<T extends HoodieRecordPayload>
@Override
public Iterator<List<WriteStatus>> call(Integer partition,
Iterator<HoodieRecord<T>> sortedRecordItr)
throws Exception {
Iterator<HoodieRecord<T>> sortedRecordItr) throws Exception {
return new LazyInsertIterable<>(sortedRecordItr, config, commitTime, hoodieTable);
}
}

View File

@@ -24,11 +24,6 @@ import com.uber.hoodie.exception.HoodieException;
import com.uber.hoodie.io.HoodieCreateHandle;
import com.uber.hoodie.io.HoodieIOHandle;
import com.uber.hoodie.table.HoodieTable;
import org.apache.log4j.LogManager;
import org.apache.log4j.Logger;
import org.apache.spark.TaskContext;
import org.apache.spark.TaskContext$;
import java.util.ArrayList;
import java.util.HashSet;
import java.util.Iterator;
@@ -38,6 +33,10 @@ import java.util.Set;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.Future;
import org.apache.log4j.LogManager;
import org.apache.log4j.Logger;
import org.apache.spark.TaskContext;
import org.apache.spark.TaskContext$;
/**
* Lazy Iterable, that writes a stream of HoodieRecords sorted by the partitionPath, into new
@@ -68,21 +67,22 @@ public class LazyInsertIterable<T extends HoodieRecordPayload> extends
@Override
protected List<WriteStatus> computeNext() {
// Need to set current spark thread's TaskContext into newly launched thread so that new thread can access
// Need to set current spark thread's TaskContext into newly launched thread so that new
// thread can access
// TaskContext properties.
final TaskContext sparkThreadTaskContext = TaskContext.get();
// Executor service used for launching writer thread.
final ExecutorService writerService = Executors.newFixedThreadPool(1);
try {
// Used for buffering records which is controlled by HoodieWriteConfig#WRITE_BUFFER_LIMIT_BYTES.
final BufferedIterator<T, HoodieRecord<T>> bufferedIterator =
new BufferedIterator<>(inputItr, hoodieConfig.getWriteBufferLimitBytes(),
// Used for buffering records which is controlled by
// HoodieWriteConfig#WRITE_BUFFER_LIMIT_BYTES.
final BufferedIterator<T, HoodieRecord<T>> bufferedIterator = new BufferedIterator<>(inputItr,
hoodieConfig.getWriteBufferLimitBytes(),
HoodieIOHandle.createHoodieWriteSchema(hoodieConfig));
Future<List<WriteStatus>> writerResult =
writerService.submit(
() -> {
Future<List<WriteStatus>> writerResult = writerService.submit(() -> {
logger.info("starting hoodie writer thread");
// Passing parent thread's TaskContext to newly launched thread for it to access original TaskContext
// Passing parent thread's TaskContext to newly launched thread for it to access original
// TaskContext
// properties.
TaskContext$.MODULE$.setTaskContext(sparkThreadTaskContext);
List<WriteStatus> statuses = new LinkedList<>();
@@ -96,7 +96,8 @@ public class LazyInsertIterable<T extends HoodieRecordPayload> extends
throw e;
}
});
// Buffering records into internal buffer. This can throw exception either if reading records from spark fails or
// Buffering records into internal buffer. This can throw exception either if reading
// records from spark fails or
// if writing buffered records into parquet file fails.
bufferedIterator.startBuffering();
logger.info("waiting for hoodie write to finish");
@@ -110,28 +111,27 @@ public class LazyInsertIterable<T extends HoodieRecordPayload> extends
}
}
private List<WriteStatus> handleWrite(final BufferedIterator<T, HoodieRecord<T>> bufferedIterator) {
private List<WriteStatus> handleWrite(
final BufferedIterator<T, HoodieRecord<T>> bufferedIterator) {
List<WriteStatus> statuses = new ArrayList<>();
while (bufferedIterator.hasNext()) {
final BufferedIterator.BufferedIteratorPayload<HoodieRecord<T>> payload = bufferedIterator.next();
final BufferedIterator.BufferedIteratorPayload<HoodieRecord<T>> payload = bufferedIterator
.next();
// clean up any partial failures
if (!partitionsCleaned.contains(payload.record.getPartitionPath())) {
// This insert task could fail multiple times, but Spark will faithfully retry with
// the same data again. Thus, before we open any files under a given partition, we
// first delete any files in the same partitionPath written by same Spark partition
HoodieIOHandle.cleanupTmpFilesFromCurrentCommit(hoodieConfig,
commitTime,
payload.record.getPartitionPath(),
TaskContext.getPartitionId(),
hoodieTable);
HoodieIOHandle.cleanupTmpFilesFromCurrentCommit(hoodieConfig, commitTime,
payload.record.getPartitionPath(), TaskContext.getPartitionId(), hoodieTable);
partitionsCleaned.add(payload.record.getPartitionPath());
}
// lazily initialize the handle, for the first time
if (handle == null) {
handle =
new HoodieCreateHandle(hoodieConfig, commitTime, hoodieTable, payload.record.getPartitionPath());
handle = new HoodieCreateHandle(hoodieConfig, commitTime, hoodieTable,
payload.record.getPartitionPath());
}
if (handle.canWrite(payload.record)) {
@@ -141,9 +141,10 @@ public class LazyInsertIterable<T extends HoodieRecordPayload> extends
// handle is full.
statuses.add(handle.close());
// Need to handle the rejected payload & open new handle
handle =
new HoodieCreateHandle(hoodieConfig, commitTime, hoodieTable, payload.record.getPartitionPath());
handle.write(payload.record, payload.insertValue, payload.exception); // we should be able to write 1 payload.
handle = new HoodieCreateHandle(hoodieConfig, commitTime, hoodieTable,
payload.record.getPartitionPath());
handle.write(payload.record, payload.insertValue,
payload.exception); // we should be able to write 1 payload.
}
}
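
The TaskContext handoff commented on above, reduced to its core; a sketch that assumes spark-core on the classpath (outside a real Spark task, TaskContext.get() is simply null).

import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.Future;
import org.apache.spark.TaskContext;
import org.apache.spark.TaskContext$;

public class WriterThreadContextSketch {

  static Future<Integer> submitWriter(ExecutorService writerService) {
    // captured on the Spark task thread...
    final TaskContext sparkThreadTaskContext = TaskContext.get();
    return writerService.submit(() -> {
      // ...and installed on the writer thread, so TaskContext-dependent code keeps working there
      TaskContext$.MODULE$.setTaskContext(sparkThreadTaskContext);
      return 0; // the real writer drains the BufferedIterator and closes handles here
    });
  }

  public static void main(String[] args) throws Exception {
    ExecutorService writerService = Executors.newFixedThreadPool(1);
    try {
      System.out.println(submitWriter(writerService).get());
    } finally {
      writerService.shutdownNow();
    }
  }
}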

View File

@@ -23,9 +23,9 @@ import java.util.Iterator;
* inputItr classes in order to simplify the implementation of lazy iterators for mapPartitions use
* cases. Note [SPARK-3369], which gives the reasons for backwards compatibility with regard to the
* iterable API despite Spark's single pass nature.
*
* <p>
* Provide a way to obtain a inputItr of type O (output), out of an inputItr of type I (input)
*
* <p>
* Things to remember: - Assumes Spark calls hasNext() to check for elements, before calling next()
* to obtain them - Assumes hasNext() gets called at least once. - Concrete Implementation is
* responsible for calling inputIterator.next() and doing the processing in computeNext()
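
A self-contained toy that mirrors (but does not reuse) the contract described in this javadoc: the work happens in computeNext(), hasNext() triggers it lazily, and next() only hands back what was already computed.

import java.util.Arrays;
import java.util.Iterator;
import java.util.function.Function;

public class LazyMappingIteratorSketch<I, O> implements Iterator<O> {

  private final Iterator<I> inputItr;
  private final Function<I, O> fn;
  private O next; // the element computed by the last hasNext() call

  public LazyMappingIteratorSketch(Iterator<I> inputItr, Function<I, O> fn) {
    this.inputItr = inputItr;
    this.fn = fn;
  }

  private O computeNext() {
    return inputItr.hasNext() ? fn.apply(inputItr.next()) : null;
  }

  @Override
  public boolean hasNext() { // assumed to be called before every next(), as the javadoc notes
    if (next == null) {
      next = computeNext();
    }
    return next != null;
  }

  @Override
  public O next() {
    O result = next;
    next = null;
    return result;
  }

  public static void main(String[] args) {
    Iterator<String> out =
        new LazyMappingIteratorSketch<>(Arrays.asList(1, 2, 3).iterator(), i -> "rec-" + i);
    while (out.hasNext()) {
      System.out.println(out.next()); // rec-1, rec-2, rec-3
    }
  }
}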

View File

@@ -37,22 +37,30 @@ import org.apache.spark.api.java.JavaSparkContext;
*/
public abstract class HoodieIndex<T extends HoodieRecordPayload> implements Serializable {
protected transient JavaSparkContext jsc = null;
public enum IndexType {
HBASE,
INMEMORY,
BLOOM,
BUCKETED
}
protected final HoodieWriteConfig config;
protected transient JavaSparkContext jsc = null;
protected HoodieIndex(HoodieWriteConfig config, JavaSparkContext jsc) {
this.config = config;
this.jsc = jsc;
}
public static <T extends HoodieRecordPayload> HoodieIndex<T> createIndex(HoodieWriteConfig config,
JavaSparkContext jsc) throws HoodieIndexException {
switch (config.getIndexType()) {
case HBASE:
return new HBaseIndex<>(config, jsc);
case INMEMORY:
return new InMemoryHashIndex<>(config, jsc);
case BLOOM:
return new HoodieBloomIndex<>(config, jsc);
case BUCKETED:
return new BucketedIndex<>(config, jsc);
default:
throw new HoodieIndexException("Index type unspecified, set " + config.getIndexType());
}
}
/**
* Checks if the given [Keys] exist in the hoodie table and returns [Key, Optional[FullFilePath]]
* If the optional FullFilePath value is not present, then the key is not found. If the
@@ -71,7 +79,7 @@ public abstract class HoodieIndex<T extends HoodieRecordPayload> implements Seri
/**
* Extracts the location of written records, and updates the index.
*
* <p>
* TODO(vc): We may need to propagate the record as well in a WriteStatus class
*/
public abstract JavaRDD<WriteStatus> updateLocation(JavaRDD<WriteStatus> writeStatusRDD,
@@ -107,18 +115,7 @@ public abstract class HoodieIndex<T extends HoodieRecordPayload> implements Seri
public abstract boolean isImplicitWithStorage();
public static <T extends HoodieRecordPayload> HoodieIndex<T> createIndex(
HoodieWriteConfig config, JavaSparkContext jsc) throws HoodieIndexException {
switch (config.getIndexType()) {
case HBASE:
return new HBaseIndex<>(config, jsc);
case INMEMORY:
return new InMemoryHashIndex<>(config, jsc);
case BLOOM:
return new HoodieBloomIndex<>(config, jsc);
case BUCKETED:
return new BucketedIndex<>(config, jsc);
}
throw new HoodieIndexException("Index type unspecified, set " + config.getIndexType());
public enum IndexType {
HBASE, INMEMORY, BLOOM, BUCKETED
}
}

View File

@@ -49,32 +49,11 @@ public class InMemoryHashIndex<T extends HoodieRecordPayload> extends HoodieInde
}
@Override
public JavaPairRDD<HoodieKey, Optional<String>> fetchRecordLocation(
JavaRDD<HoodieKey> hoodieKeys, final HoodieTable<T> table) {
public JavaPairRDD<HoodieKey, Optional<String>> fetchRecordLocation(JavaRDD<HoodieKey> hoodieKeys,
final HoodieTable<T> table) {
throw new UnsupportedOperationException("InMemory index does not implement check exist yet");
}
/**
* Function that tags each HoodieRecord with an existing location, if known.
*/
class LocationTagFunction
implements Function2<Integer, Iterator<HoodieRecord<T>>, Iterator<HoodieRecord<T>>> {
@Override
public Iterator<HoodieRecord<T>> call(Integer partitionNum,
Iterator<HoodieRecord<T>> hoodieRecordIterator) {
List<HoodieRecord<T>> taggedRecords = new ArrayList<>();
while (hoodieRecordIterator.hasNext()) {
HoodieRecord<T> rec = hoodieRecordIterator.next();
if (recordLocationMap.containsKey(rec.getKey())) {
rec.setCurrentLocation(recordLocationMap.get(rec.getKey()));
}
taggedRecords.add(rec);
}
return taggedRecords.iterator();
}
}
@Override
public JavaRDD<HoodieRecord<T>> tagLocation(JavaRDD<HoodieRecord<T>> recordRDD,
HoodieTable<T> hoodieTable) {
@@ -132,4 +111,25 @@ public class InMemoryHashIndex<T extends HoodieRecordPayload> extends HoodieInde
public boolean isImplicitWithStorage() {
return false;
}
/**
* Function that tags each HoodieRecord with an existing location, if known.
*/
class LocationTagFunction implements
Function2<Integer, Iterator<HoodieRecord<T>>, Iterator<HoodieRecord<T>>> {
@Override
public Iterator<HoodieRecord<T>> call(Integer partitionNum,
Iterator<HoodieRecord<T>> hoodieRecordIterator) {
List<HoodieRecord<T>> taggedRecords = new ArrayList<>();
while (hoodieRecordIterator.hasNext()) {
HoodieRecord<T> rec = hoodieRecordIterator.next();
if (recordLocationMap.containsKey(rec.getKey())) {
rec.setCurrentLocation(recordLocationMap.get(rec.getKey()));
}
taggedRecords.add(rec);
}
return taggedRecords.iterator();
}
}
}

View File

@@ -64,8 +64,7 @@ public class BloomIndexFileInfo implements Serializable {
* Does the given key fall within the range (inclusive)
*/
public boolean isKeyInRange(String recordKey) {
return minRecordKey.compareTo(recordKey) <= 0 &&
maxRecordKey.compareTo(recordKey) >= 0;
return minRecordKey.compareTo(recordKey) <= 0 && maxRecordKey.compareTo(recordKey) >= 0;
}
@Override
@@ -78,9 +77,8 @@ public class BloomIndexFileInfo implements Serializable {
}
BloomIndexFileInfo that = (BloomIndexFileInfo) o;
return Objects.equal(that.fileName, fileName) &&
Objects.equal(that.minRecordKey, minRecordKey) &&
Objects.equal(that.maxRecordKey, maxRecordKey);
return Objects.equal(that.fileName, fileName) && Objects.equal(that.minRecordKey, minRecordKey)
&& Objects.equal(that.maxRecordKey, maxRecordKey);
}
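
The inclusive check in isKeyInRange() is what makes range pruning effective when record keys carry an ordered prefix (e.g. a timestamp): a file whose [min, max] keys cannot contain the incoming key is skipped before its bloom filter is ever loaded. A self-contained sketch with made-up keys:

public class RangePruningSketch {

  // Same inclusive comparison as isKeyInRange() above.
  static boolean isKeyInRange(String minRecordKey, String maxRecordKey, String recordKey) {
    return minRecordKey.compareTo(recordKey) <= 0 && maxRecordKey.compareTo(recordKey) >= 0;
  }

  public static void main(String[] args) {
    // Pretend one data file advertises these min/max record keys.
    String min = "20180301_0001";
    String max = "20180310_9999";

    System.out.println(isKeyInRange(min, max, "20180305_1234")); // true  -> file must be checked
    System.out.println(isKeyInRange(min, max, "20180320_0007")); // false -> file pruned, no bloom lookup
  }
}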

View File

@@ -56,12 +56,11 @@ import scala.Tuple2;
*/
public class HoodieBloomIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
private static Logger logger = LogManager.getLogger(HoodieBloomIndex.class);
// we need to limit the join such that it stays within 1.5GB per Spark partition. (SPARK-1476)
private static final int SPARK_MAXIMUM_BYTES_PER_PARTITION = 1500 * 1024 * 1024;
// this is how much a triplet of (partitionPath, fileId, recordKey) costs.
private static final int BYTES_PER_PARTITION_FILE_KEY_TRIPLET = 300;
private static Logger logger = LogManager.getLogger(HoodieBloomIndex.class);
private static int MAX_ITEMS_PER_SHUFFLE_PARTITION =
SPARK_MAXIMUM_BYTES_PER_PARTITION / BYTES_PER_PARTITION_FILE_KEY_TRIPLET;
@@ -108,27 +107,26 @@ public class HoodieBloomIndex<T extends HoodieRecordPayload> extends HoodieIndex
return taggedRecordRDD;
}
public JavaPairRDD<HoodieKey, Optional<String>> fetchRecordLocation(
JavaRDD<HoodieKey> hoodieKeys, final HoodieTable<T> table) {
JavaPairRDD<String, String> partitionRecordKeyPairRDD =
hoodieKeys.mapToPair(key -> new Tuple2<>(key.getPartitionPath(), key.getRecordKey()));
public JavaPairRDD<HoodieKey, Optional<String>> fetchRecordLocation(JavaRDD<HoodieKey> hoodieKeys,
final HoodieTable<T> table) {
JavaPairRDD<String, String> partitionRecordKeyPairRDD = hoodieKeys
.mapToPair(key -> new Tuple2<>(key.getPartitionPath(), key.getRecordKey()));
// Lookup indexes for all the partition/recordkey pair
JavaPairRDD<String, String> rowKeyFilenamePairRDD =
lookupIndex(partitionRecordKeyPairRDD, table);
JavaPairRDD<String, String> rowKeyFilenamePairRDD = lookupIndex(partitionRecordKeyPairRDD,
table);
JavaPairRDD<String, HoodieKey> rowKeyHoodieKeyPairRDD =
hoodieKeys.mapToPair(key -> new Tuple2<>(key.getRecordKey(), key));
JavaPairRDD<String, HoodieKey> rowKeyHoodieKeyPairRDD = hoodieKeys
.mapToPair(key -> new Tuple2<>(key.getRecordKey(), key));
return rowKeyHoodieKeyPairRDD.leftOuterJoin(rowKeyFilenamePairRDD)
.mapToPair(keyPathTuple -> {
return rowKeyHoodieKeyPairRDD.leftOuterJoin(rowKeyFilenamePairRDD).mapToPair(keyPathTuple -> {
Optional<String> recordLocationPath;
if (keyPathTuple._2._2.isPresent()) {
String fileName = keyPathTuple._2._2.get();
String partitionPath = keyPathTuple._2._1.getPartitionPath();
recordLocationPath = Optional.of(new Path(
new Path(table.getMetaClient().getBasePath(), partitionPath),
fileName).toUri().getPath());
recordLocationPath = Optional
.of(new Path(new Path(table.getMetaClient().getBasePath(), partitionPath), fileName)
.toUri().getPath());
} else {
recordLocationPath = Optional.absent();
}
@@ -152,21 +150,21 @@ public class HoodieBloomIndex<T extends HoodieRecordPayload> extends HoodieIndex
final Map<String, List<BloomIndexFileInfo>> partitionToFileInfo = fileInfoList.stream()
.collect(groupingBy(Tuple2::_1, mapping(Tuple2::_2, toList())));
// Step 3: Obtain a RDD, for each incoming record, that already exists, with the file id, that contains it.
// Step 3: Obtain a RDD, for each incoming record, that already exists, with the file id,
// that contains it.
int parallelism = autoComputeParallelism(recordsPerPartition, partitionToFileInfo,
partitionRecordKeyPairRDD);
return findMatchingFilesForRecordKeys(hoodieTable, partitionToFileInfo,
partitionRecordKeyPairRDD,
parallelism);
partitionRecordKeyPairRDD, parallelism);
}
/**
* The index lookup can be skewed in three dimensions : #files, #partitions, #records
*
* <p>
* To be able to smoothly handle skews, we need to compute how to split each partitions into
* subpartitions. We do it here, in a way that keeps the amount of each Spark join partition to <
* 2GB.
*
* <p>
* If {@link com.uber.hoodie.config.HoodieIndexConfig#BLOOM_INDEX_PARALLELISM_PROP} is specified
* as a NON-zero number, then that is used explicitly.
*/
@@ -184,7 +182,8 @@ public class HoodieBloomIndex<T extends HoodieRecordPayload> extends HoodieIndex
// records for a partition.
Map<String, Long> filesPerPartition = partitionToFileInfo.entrySet().stream()
.collect(Collectors.toMap(Map.Entry::getKey, e -> Long.valueOf(e.getValue().size())));
long totalFiles = 0, totalRecords = 0;
long totalFiles = 0;
long totalRecords = 0;
for (String partitionPath : recordsPerPartition.keySet()) {
long numRecords = recordsPerPartition.get(partitionPath);
long numFiles =
@@ -210,22 +209,22 @@ public class HoodieBloomIndex<T extends HoodieRecordPayload> extends HoodieIndex
/**
* It's crucial to pick the right parallelism.
*
* <p>
* totalSubPartitions : this is deemed a safe limit, to be nice with Spark. inputParallelism :
* typically number of input file splits
*
* <p>
* We pick the max such that we are always safe, but go higher if, say, there are a lot of input
* files. (otherwise, we will fall back to the number of partitions in input and end up with slow
* performance)
*/
private int determineParallelism(int inputParallelism, int totalSubPartitions) {
// If bloom index parallelism is set, use it to check against the input parallelism and take the max
// If bloom index parallelism is set, use it to check against the input parallelism and
// take the max
int indexParallelism = Math.max(inputParallelism, config.getBloomIndexParallelism());
int joinParallelism = Math.max(totalSubPartitions, indexParallelism);
logger.info("InputParallelism: ${" + inputParallelism + "}, " +
"IndexParallelism: ${" + config.getBloomIndexParallelism() + "}, " +
"TotalSubParts: ${" + totalSubPartitions + "}, " +
"Join Parallelism set to : " + joinParallelism);
logger.info("InputParallelism: ${" + inputParallelism + "}, " + "IndexParallelism: ${" + config
.getBloomIndexParallelism() + "}, " + "TotalSubParts: ${" + totalSubPartitions + "}, "
+ "Join Parallelism set to : " + joinParallelism);
return joinParallelism;
}
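
Worked numbers for the sizing above, using the constants declared at the top of this class; how the total sub-partition count is derived is only sketched here, since autoComputeParallelism() is not fully visible in this hunk.

public class BloomParallelismSketch {
  public static void main(String[] args) {
    int sparkMaxBytesPerPartition = 1500 * 1024 * 1024; // ~1.5 GB cap per Spark partition (SPARK-1476)
    int bytesPerTriplet = 300;                          // cost of one (partitionPath, fileId, recordKey)
    int maxItemsPerShufflePartition = sparkMaxBytesPerPartition / bytesPerTriplet; // 5,242,880 triplets

    long estimatedComparisons = 40_000_000L; // assume ~40M file<=>record comparisons after pruning
    int totalSubPartitions =
        (int) Math.ceil((double) estimatedComparisons / maxItemsPerShufflePartition); // 8

    int inputParallelism = 120;          // partitions of the incoming record RDD
    int configuredBloomParallelism = 0;  // 0 = let hoodie auto-compute
    int indexParallelism = Math.max(inputParallelism, configuredBloomParallelism);
    int joinParallelism = Math.max(totalSubPartitions, indexParallelism);
    System.out.println(joinParallelism); // 120: the input parallelism dominates in this example
  }
}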
@@ -237,29 +236,24 @@ public class HoodieBloomIndex<T extends HoodieRecordPayload> extends HoodieIndex
final HoodieTable<T> hoodieTable) {
// Obtain the latest data files from all the partitions.
List<Tuple2<String, HoodieDataFile>> dataFilesList = jsc
.parallelize(partitions, Math.max(partitions.size(), 1))
.flatMapToPair(partitionPath -> {
java.util.Optional<HoodieInstant> latestCommitTime =
hoodieTable.getCommitsTimeline().filterCompletedInstants().lastInstant();
.parallelize(partitions, Math.max(partitions.size(), 1)).flatMapToPair(partitionPath -> {
java.util.Optional<HoodieInstant> latestCommitTime = hoodieTable.getCommitsTimeline()
.filterCompletedInstants().lastInstant();
List<Tuple2<String, HoodieDataFile>> filteredFiles = new ArrayList<>();
if (latestCommitTime.isPresent()) {
filteredFiles =
hoodieTable.getROFileSystemView().getLatestDataFilesBeforeOrOn(partitionPath,
latestCommitTime.get().getTimestamp())
.map(f -> new Tuple2<>(partitionPath, f))
.collect(toList());
filteredFiles = hoodieTable.getROFileSystemView()
.getLatestDataFilesBeforeOrOn(partitionPath, latestCommitTime.get().getTimestamp())
.map(f -> new Tuple2<>(partitionPath, f)).collect(toList());
}
return filteredFiles.iterator();
}).collect();
if (config.getBloomIndexPruneByRanges()) {
// also obtain file ranges, if range pruning is enabled
return jsc.parallelize(dataFilesList, Math.max(dataFilesList.size(), 1))
.mapToPair(ft -> {
return jsc.parallelize(dataFilesList, Math.max(dataFilesList.size(), 1)).mapToPair(ft -> {
try {
String[] minMaxKeys = ParquetUtils
.readMinMaxRecordKeys(hoodieTable.getHadoopConf(),
ft._2().getFileStatus().getPath());
.readMinMaxRecordKeys(hoodieTable.getHadoopConf(), ft._2().getFileStatus().getPath());
return new Tuple2<>(ft._1(),
new BloomIndexFileInfo(ft._2().getFileName(), minMaxKeys[0], minMaxKeys[1]));
} catch (MetadataNotFoundException me) {
@@ -320,21 +314,20 @@ public class HoodieBloomIndex<T extends HoodieRecordPayload> extends HoodieIndex
* (e.g: timestamp as prefix), the number of files to be compared gets cut down a lot from range
* pruning.
*/
// sub-partition to ensure the records can be looked up against files & also prune file<=>record comparisons based on recordKey
// sub-partition to ensure the records can be looked up against files & also prune
// file<=>record comparisons based on recordKey
// ranges in the index info.
@VisibleForTesting
JavaPairRDD<String, Tuple2<String, HoodieKey>> explodeRecordRDDWithFileComparisons(
final Map<String, List<BloomIndexFileInfo>> partitionToFileIndexInfo,
JavaPairRDD<String, String> partitionRecordKeyPairRDD) {
return partitionRecordKeyPairRDD
.map(partitionRecordKeyPair -> {
return partitionRecordKeyPairRDD.map(partitionRecordKeyPair -> {
String recordKey = partitionRecordKeyPair._2();
String partitionPath = partitionRecordKeyPair._1();
List<BloomIndexFileInfo> indexInfos = partitionToFileIndexInfo.get(partitionPath);
List<Tuple2<String, Tuple2<String, HoodieKey>>> recordComparisons = new ArrayList<>();
if (indexInfos
!= null) { // could be null, if there are no files in a given partition yet.
if (indexInfos != null) { // could be null, if there are no files in a given partition yet.
// for each candidate file in partition, that needs to be compared.
for (BloomIndexFileInfo indexInfo : indexInfos) {
if (shouldCompareWithFile(indexInfo, recordKey)) {
@@ -346,35 +339,34 @@ public class HoodieBloomIndex<T extends HoodieRecordPayload> extends HoodieIndex
}
}
return recordComparisons;
})
.flatMapToPair(t -> t.iterator());
}).flatMapToPair(t -> t.iterator());
}
/**
* Find out <RowKey, filename> pair. All workload grouped by file-level.
*
* <p>
* Join PairRDD(PartitionPath, RecordKey) and PairRDD(PartitionPath, File) & then repartition such
* that each RDD partition is a file, then for each file, we do (1) load bloom filter, (2) load
* rowKeys, (3) Tag rowKey
*
* <p>
* Make sure the parallelism is at least the groupby parallelism for tagging location
*/
@VisibleForTesting
JavaPairRDD<String, String> findMatchingFilesForRecordKeys(HoodieTable hoodieTable,
final Map<String, List<BloomIndexFileInfo>> partitionToFileIndexInfo,
JavaPairRDD<String, String> partitionRecordKeyPairRDD,
int totalSubpartitions) {
JavaPairRDD<String, String> partitionRecordKeyPairRDD, int totalSubpartitions) {
int joinParallelism = determineParallelism(partitionRecordKeyPairRDD.partitions().size(),
totalSubpartitions);
JavaPairRDD<String, Tuple2<String, HoodieKey>> fileSortedTripletRDD = explodeRecordRDDWithFileComparisons(
JavaPairRDD<String, Tuple2<String, HoodieKey>> fileSortedTripletRDD =
explodeRecordRDDWithFileComparisons(
partitionToFileIndexInfo, partitionRecordKeyPairRDD)
// sort further based on filename, such that all checking for the file can happen within a single partition, on-the-fly
// sort further based on filename, such that all checking for the file can happen within
// a single partition, on-the-fly
.sortByKey(true, joinParallelism);
return fileSortedTripletRDD
.mapPartitionsWithIndex(
return fileSortedTripletRDD.mapPartitionsWithIndex(
new HoodieBloomIndexCheckFunction(hoodieTable, config.getBasePath()), true)
.flatMap(indexLookupResults -> indexLookupResults.iterator())
.filter(lookupResult -> lookupResult.getMatchingRecordKeys().size() > 0)
@@ -391,14 +383,13 @@ public class HoodieBloomIndex<T extends HoodieRecordPayload> extends HoodieIndex
* Tag the <rowKey, filename> back to the original HoodieRecord RDD.
*/
private JavaRDD<HoodieRecord<T>> tagLocationBacktoRecords(
JavaPairRDD<String, String> rowKeyFilenamePairRDD,
JavaRDD<HoodieRecord<T>> recordRDD) {
JavaPairRDD<String, String> rowKeyFilenamePairRDD, JavaRDD<HoodieRecord<T>> recordRDD) {
JavaPairRDD<String, HoodieRecord<T>> rowKeyRecordPairRDD = recordRDD
.mapToPair(record -> new Tuple2<>(record.getRecordKey(), record));
// Since the recordRDD might have more data than rowKeyRDD (some rowKeys' fileId is null), we do a left outer join.
return rowKeyRecordPairRDD.leftOuterJoin(rowKeyFilenamePairRDD).values().map(
v1 -> {
// Since the recordRDD might have more data than rowKeyRDD (some rowKeys' fileId is null),
// we do a left outer join.
return rowKeyRecordPairRDD.leftOuterJoin(rowKeyFilenamePairRDD).values().map(v1 -> {
HoodieRecord<T> record = v1._1();
if (v1._2().isPresent()) {
String filename = v1._2().get();
@@ -408,8 +399,7 @@ public class HoodieBloomIndex<T extends HoodieRecordPayload> extends HoodieIndex
}
}
return record;
}
);
});
}
@Override

View File

@@ -41,7 +41,8 @@ import scala.Tuple2;
* actual files
*/
public class HoodieBloomIndexCheckFunction implements
Function2<Integer, Iterator<Tuple2<String, Tuple2<String, HoodieKey>>>, Iterator<List<IndexLookupResult>>> {
Function2<Integer, Iterator<Tuple2<String, Tuple2<String, HoodieKey>>>,
Iterator<List<IndexLookupResult>>> {
private static Logger logger = LogManager.getLogger(HoodieBloomIndexCheckFunction.class);
@@ -58,8 +59,7 @@ public class HoodieBloomIndexCheckFunction implements
* Given a list of row keys and one file, return only row keys existing in that file.
*/
public static List<String> checkCandidatesAgainstFile(Configuration configuration,
List<String> candidateRecordKeys,
Path filePath) throws HoodieIndexException {
List<String> candidateRecordKeys, Path filePath) throws HoodieIndexException {
List<String> foundRecordKeys = new ArrayList<>();
try {
// Load all rowKeys from the file, to double-confirm
@@ -86,6 +86,13 @@ public class HoodieBloomIndexCheckFunction implements
return foundRecordKeys;
}
@Override
public Iterator<List<IndexLookupResult>> call(Integer partition,
Iterator<Tuple2<String, Tuple2<String, HoodieKey>>> fileParitionRecordKeyTripletItr)
throws Exception {
return new LazyKeyCheckIterator(fileParitionRecordKeyTripletItr);
}
class LazyKeyCheckIterator extends
LazyIterableIterator<Tuple2<String, Tuple2<String, HoodieKey>>, List<IndexLookupResult>> {
@@ -143,7 +150,8 @@ public class HoodieBloomIndexCheckFunction implements
// if continue on current file)
if (fileName.equals(currentFile)) {
// check record key against bloom filter of current file & add to possible keys if needed
// check record key against bloom filter of current file & add to possible keys if
// needed
if (bloomFilter.mightContain(recordKey)) {
if (logger.isDebugEnabled()) {
logger.debug("#1 Adding " + recordKey + " as candidate for file " + fileName);
@@ -201,12 +209,4 @@ public class HoodieBloomIndexCheckFunction implements
protected void end() {
}
}
@Override
public Iterator<List<IndexLookupResult>> call(Integer partition,
Iterator<Tuple2<String, Tuple2<String, HoodieKey>>> fileParitionRecordKeyTripletItr)
throws Exception {
return new LazyKeyCheckIterator(fileParitionRecordKeyTripletItr);
}
}
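
The per-file work done by LazyKeyCheckIterator is a two-phase check: collect candidates through the bloom filter (which may return false positives), then confirm them against the keys actually stored in the file. A sketch of that flow, with Guava's BloomFilter standing in for hoodie's own filter and a Set standing in for the file scan:

import com.google.common.hash.BloomFilter;
import com.google.common.hash.Funnels;
import java.nio.charset.StandardCharsets;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.HashSet;
import java.util.List;
import java.util.Set;

public class TwoPhaseKeyCheckSketch {
  public static void main(String[] args) {
    Set<String> keysActuallyInFile = new HashSet<>(Arrays.asList("key-001", "key-042"));

    BloomFilter<String> filter =
        BloomFilter.create(Funnels.stringFunnel(StandardCharsets.UTF_8), 100);
    keysActuallyInFile.forEach(filter::put);

    List<String> incoming = Arrays.asList("key-001", "key-007", "key-042");

    // Phase 1: cheap in-memory check, may keep keys that are not really in the file.
    List<String> candidates = new ArrayList<>();
    for (String key : incoming) {
      if (filter.mightContain(key)) {
        candidates.add(key);
      }
    }

    // Phase 2: double-confirm against the row keys read from the file itself.
    candidates.retainAll(keysActuallyInFile);
    System.out.println(candidates); // [key-001, key-042]
  }
}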

View File

@@ -38,9 +38,9 @@ import scala.Tuple2;
/**
* A `stateless` index implementation that uses a deterministic mapping function to determine
* the fileID for a given record.
*
* <p>
* Pros: - Fast
*
* <p>
* Cons : - Need to tune the number of buckets per partition path manually (FIXME: Need to autotune
* this) - Could increase write amplification on copy-on-write storage since inserts always rewrite
* files - Not global.
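
The concrete mapping function is not part of this hunk, so the sketch below is only one plausible shape of it (a hypothetical helper, not the class's actual method): the same record key always resolves to the same bucket, which is exactly what lets the index stay stateless.

public class BucketMappingSketch {

  // Hypothetical helper: derive a stable bucket id from the record key.
  static int bucketFor(String recordKey, int numBucketsPerPartition) {
    return Math.floorMod(recordKey.hashCode(), numBucketsPerPartition);
  }

  public static void main(String[] args) {
    int numBuckets = 16; // cf. hoodie.index.bucketed.numbuckets
    System.out.println(bucketFor("driver-123", numBuckets)); // same value on every run and executor,
    System.out.println(bucketFor("driver-123", numBuckets)); // so updates for a key always target one bucket
  }
}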

View File

@@ -27,12 +27,16 @@ import com.uber.hoodie.common.model.HoodieRecordLocation;
import com.uber.hoodie.common.model.HoodieRecordPayload;
import com.uber.hoodie.common.table.HoodieTimeline;
import com.uber.hoodie.common.table.timeline.HoodieInstant;
import com.uber.hoodie.config.HoodieIndexConfig;
import com.uber.hoodie.config.HoodieWriteConfig;
import com.uber.hoodie.exception.HoodieDependentSystemUnavailableException;
import com.uber.hoodie.exception.HoodieIndexException;
import com.uber.hoodie.index.HoodieIndex;
import com.uber.hoodie.table.HoodieTable;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.LinkedList;
import java.util.List;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.HBaseConfiguration;
import org.apache.hadoop.hbase.TableName;
@@ -51,23 +55,18 @@ import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.api.java.function.Function2;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.LinkedList;
import java.util.List;
/**
* Hoodie Index implementation backed by HBase
*/
public class HBaseIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
private final static byte[] SYSTEM_COLUMN_FAMILY = Bytes.toBytes("_s");
private final static byte[] COMMIT_TS_COLUMN = Bytes.toBytes("commit_ts");
private final static byte[] FILE_NAME_COLUMN = Bytes.toBytes("file_name");
private final static byte[] PARTITION_PATH_COLUMN = Bytes.toBytes("partition_path");
private static final byte[] SYSTEM_COLUMN_FAMILY = Bytes.toBytes("_s");
private static final byte[] COMMIT_TS_COLUMN = Bytes.toBytes("commit_ts");
private static final byte[] FILE_NAME_COLUMN = Bytes.toBytes("file_name");
private static final byte[] PARTITION_PATH_COLUMN = Bytes.toBytes("partition_path");
private static Logger logger = LogManager.getLogger(HBaseIndex.class);
private static Connection hbaseConnection = null;
private final String tableName;
public HBaseIndex(HoodieWriteConfig config, JavaSparkContext jsc) {
@@ -77,14 +76,12 @@ public class HBaseIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
}
@Override
public JavaPairRDD<HoodieKey, Optional<String>> fetchRecordLocation(
JavaRDD<HoodieKey> hoodieKeys, HoodieTable<T> table) {
public JavaPairRDD<HoodieKey, Optional<String>> fetchRecordLocation(JavaRDD<HoodieKey> hoodieKeys,
HoodieTable<T> table) {
//TODO : Change/Remove filterExists in HoodieReadClient() and revisit
throw new UnsupportedOperationException("HBase index does not implement check exist");
}
private static Connection hbaseConnection = null;
private Connection getHBaseConnection() {
Configuration hbaseConfig = HBaseConfiguration.create();
String quorum = config.getHbaseZkQuorum();
@@ -100,8 +97,8 @@ public class HBaseIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
}
/**
* Since we are sharing the HbaseConnection across tasks in a JVM, make sure the HbaseConnectio is closed when
* JVM exits
* Since we are sharing the HbaseConnection across tasks in a JVM, make sure the HbaseConnection is
* closed when the JVM exits
*/
private void addShutDownHook() {
Runtime.getRuntime().addShutdownHook(new Thread() {
@@ -126,10 +123,11 @@ public class HBaseIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
HoodieTimeline commitTimeline = hoodieTable.getCompletedCommitTimeline();
// Check if the last commit ts for this row is 1) present in the timeline or
// 2) is less than the first commit ts in the timeline
return !commitTimeline.empty() && (commitTimeline.containsInstant(
new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTs)) ||
HoodieTimeline.compareTimestamps(commitTimeline.firstInstant().get().getTimestamp(),
commitTs, HoodieTimeline.GREATER));
return !commitTimeline.empty() && (commitTimeline
.containsInstant(new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTs))
|| HoodieTimeline
.compareTimestamps(commitTimeline.firstInstant().get().getTimestamp(), commitTs,
HoodieTimeline.GREATER));
}
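The timeline check above treats a commit timestamp tagged on an HBase row as usable only if it is present in the completed timeline, or strictly older than the earliest instant still on that timeline (i.e. already archived). A small standalone sketch of that rule over a sorted set of commit timestamps standing in for the real HoodieTimeline (the timestamp format is an assumption for illustration):

import java.util.TreeSet;

public class CommitValidityCheckSketch {

  /**
   * A commit ts is considered valid when it is either one of the completed commits,
   * or older than the first commit we still track (already archived).
   */
  static boolean isValidCommit(TreeSet<String> completedCommits, String commitTs) {
    if (completedCommits.isEmpty()) {
      return false;
    }
    boolean presentInTimeline = completedCommits.contains(commitTs);
    // Timestamps are zero-padded strings (e.g. "20180320162920"), so String ordering works.
    boolean olderThanFirst = completedCommits.first().compareTo(commitTs) > 0;
    return presentInTimeline || olderThanFirst;
  }

  public static void main(String[] args) {
    TreeSet<String> timeline = new TreeSet<>();
    timeline.add("20180318120000");
    timeline.add("20180319120000");
    timeline.add("20180320120000");

    System.out.println(isValidCommit(timeline, "20180319120000")); // true: in timeline
    System.out.println(isValidCommit(timeline, "20180317090000")); // true: older than first instant
    System.out.println(isValidCommit(timeline, "20180320180000")); // false: unknown, possibly failed commit
  }
}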
/**
@@ -171,16 +169,17 @@ public class HBaseIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
HoodieRecord currentRecord = currentBatchOfRecords.remove(0);
if (result.getRow() != null) {
String keyFromResult = Bytes.toString(result.getRow());
String commitTs =
Bytes.toString(result.getValue(SYSTEM_COLUMN_FAMILY, COMMIT_TS_COLUMN));
String fileId =
Bytes.toString(result.getValue(SYSTEM_COLUMN_FAMILY, FILE_NAME_COLUMN));
String partitionPath =
Bytes.toString(result.getValue(SYSTEM_COLUMN_FAMILY, PARTITION_PATH_COLUMN));
String commitTs = Bytes
.toString(result.getValue(SYSTEM_COLUMN_FAMILY, COMMIT_TS_COLUMN));
String fileId = Bytes
.toString(result.getValue(SYSTEM_COLUMN_FAMILY, FILE_NAME_COLUMN));
String partitionPath = Bytes
.toString(result.getValue(SYSTEM_COLUMN_FAMILY, PARTITION_PATH_COLUMN));
if (checkIfValidCommit(hoodieTable, commitTs)) {
currentRecord = new HoodieRecord(new HoodieKey(currentRecord.getRecordKey(),
partitionPath), currentRecord.getData());
currentRecord = new HoodieRecord(
new HoodieKey(currentRecord.getRecordKey(), partitionPath),
currentRecord.getData());
currentRecord.setCurrentLocation(new HoodieRecordLocation(commitTs, fileId));
taggedRecords.add(currentRecord);
// the key from Result and the key being processed should be same
@@ -217,10 +216,10 @@ public class HBaseIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
return recordRDD.mapPartitionsWithIndex(locationTagFunction(hoodieTable), true);
}
private Function2<Integer, Iterator<WriteStatus>, Iterator<WriteStatus>> updateLocationFunction() {
return (Function2<Integer, Iterator<WriteStatus>, Iterator<WriteStatus>>) (partition, statusIterator) -> {
private Function2<Integer, Iterator<WriteStatus>, Iterator<WriteStatus>>
updateLocationFunction() {
return (Function2<Integer, Iterator<WriteStatus>, Iterator<WriteStatus>>) (partition,
statusIterator) -> {
Integer multiPutBatchSize = config.getHbaseIndexPutBatchSize();
List<WriteStatus> writeStatusList = new ArrayList<>();
@@ -292,12 +291,9 @@ public class HBaseIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
/**
* Helper method to facilitate performing puts and deletes in Hbase
* @param hTable
* @param puts
* @param deletes
* @throws IOException
*/
private void doPutsAndDeletes(HTable hTable, List<Put> puts, List<Delete> deletes) throws IOException {
private void doPutsAndDeletes(HTable hTable, List<Put> puts, List<Delete> deletes)
throws IOException {
if (puts.size() > 0) {
hTable.put(puts);
}
@@ -323,7 +319,6 @@ public class HBaseIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
/**
* Only looks up by recordKey
* @return
*/
@Override
public boolean isGlobal() {
@@ -332,7 +327,6 @@ public class HBaseIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
/**
* Mapping is available in HBase already.
* @return
*/
@Override
public boolean canIndexLogFiles() {
@@ -341,7 +335,6 @@ public class HBaseIndex<T extends HoodieRecordPayload> extends HoodieIndex<T> {
/**
* Index needs to be explicitly updated after storage write.
* @return
*/
@Override
public boolean isImplicitWithStorage() {

View File

@@ -37,14 +37,6 @@ import com.uber.hoodie.config.HoodieWriteConfig;
import com.uber.hoodie.exception.HoodieAppendException;
import com.uber.hoodie.exception.HoodieUpsertException;
import com.uber.hoodie.table.HoodieTable;
import org.apache.avro.generic.GenericRecord;
import org.apache.avro.generic.IndexedRecord;
import org.apache.hadoop.fs.Path;
import org.apache.log4j.LogManager;
import org.apache.log4j.Logger;
import org.apache.spark.TaskContext;
import org.apache.spark.util.SizeEstimator;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Comparator;
@@ -53,6 +45,13 @@ import java.util.List;
import java.util.Map;
import java.util.Optional;
import java.util.concurrent.atomic.AtomicLong;
import org.apache.avro.generic.GenericRecord;
import org.apache.avro.generic.IndexedRecord;
import org.apache.hadoop.fs.Path;
import org.apache.log4j.LogManager;
import org.apache.log4j.Logger;
import org.apache.spark.TaskContext;
import org.apache.spark.util.SizeEstimator;
/**
* IO Operation to append data onto an existing file.
@@ -61,14 +60,13 @@ public class HoodieAppendHandle<T extends HoodieRecordPayload> extends HoodieIOH
private static Logger logger = LogManager.getLogger(HoodieAppendHandle.class);
private static AtomicLong recordIndex = new AtomicLong(1);
private TableFileSystemView.RealtimeView fileSystemView;
private final WriteStatus writeStatus;
private final String fileId;
private String partitionPath;
private Iterator<HoodieRecord<T>> recordItr;
List<IndexedRecord> recordList = new ArrayList<>();
List<String> keysToDelete = new ArrayList<>();
private TableFileSystemView.RealtimeView fileSystemView;
private String partitionPath;
private Iterator<HoodieRecord<T>> recordItr;
private long recordsWritten = 0;
private long recordsDeleted = 0;
private long averageRecordSize = 0;
@@ -76,11 +74,8 @@ public class HoodieAppendHandle<T extends HoodieRecordPayload> extends HoodieIOH
private Writer writer;
private boolean doInit = true;
public HoodieAppendHandle(HoodieWriteConfig config,
String commitTime,
HoodieTable<T> hoodieTable,
String fileId,
Iterator<HoodieRecord<T>> recordItr) {
public HoodieAppendHandle(HoodieWriteConfig config, String commitTime, HoodieTable<T> hoodieTable,
String fileId, Iterator<HoodieRecord<T>> recordItr) {
super(config, commitTime, hoodieTable);
WriteStatus writeStatus = ReflectionUtils.loadClass(config.getWriteStatusClassName());
writeStatus.setStat(new HoodieDeltaWriteStat());
@@ -94,8 +89,8 @@ public class HoodieAppendHandle<T extends HoodieRecordPayload> extends HoodieIOH
// extract some information from the first record
FileSlice fileSlice = fileSystemView.getLatestFileSlices(partitionPath)
.filter(fileSlice1 -> fileSlice1.getDataFile().get().getFileId().equals(fileId))
.findFirst().get();
.filter(fileSlice1 -> fileSlice1.getDataFile().get().getFileId().equals(fileId)).findFirst()
.get();
// HACK(vc) This also assumes a base file. It will break, if appending without one.
String latestValidFilePath = fileSlice.getDataFile().get().getFileName();
String baseCommitTime = FSUtils.getCommitTime(latestValidFilePath);
@@ -108,23 +103,21 @@ public class HoodieAppendHandle<T extends HoodieRecordPayload> extends HoodieIOH
try {
this.writer = HoodieLogFormat.newWriterBuilder()
.onParentPath(new Path(hoodieTable.getMetaClient().getBasePath(), partitionPath))
.withFileId(fileId).overBaseCommit(baseCommitTime).withLogVersion(fileSlice.getLogFiles()
.map(logFile -> logFile.getLogVersion())
.withFileId(fileId).overBaseCommit(baseCommitTime).withLogVersion(
fileSlice.getLogFiles().map(logFile -> logFile.getLogVersion())
.max(Comparator.naturalOrder()).orElse(HoodieLogFile.LOGFILE_BASE_VERSION))
.withSizeThreshold(config.getLogFileMaxSize())
.withFs(fs).withFileExtension(HoodieLogFile.DELTA_EXTENSION).build();
.withSizeThreshold(config.getLogFileMaxSize()).withFs(fs)
.withFileExtension(HoodieLogFile.DELTA_EXTENSION).build();
this.currentLogFile = writer.getLogFile();
((HoodieDeltaWriteStat) writeStatus.getStat())
.setLogVersion(currentLogFile.getLogVersion());
((HoodieDeltaWriteStat) writeStatus.getStat())
.setLogOffset(writer.getCurrentSize());
((HoodieDeltaWriteStat) writeStatus.getStat()).setLogVersion(currentLogFile.getLogVersion());
((HoodieDeltaWriteStat) writeStatus.getStat()).setLogOffset(writer.getCurrentSize());
} catch (Exception e) {
logger.error("Error in update task at commit " + commitTime, e);
writeStatus.setGlobalError(e);
throw new HoodieUpsertException(
"Failed to initialize HoodieUpdateHandle for FileId: " + fileId
+ " on commit " + commitTime + " on HDFS path " + hoodieTable
.getMetaClient().getBasePath() + partitionPath, e);
"Failed to initialize HoodieUpdateHandle for FileId: " + fileId + " on commit "
+ commitTime + " on HDFS path " + hoodieTable.getMetaClient().getBasePath()
+ partitionPath, e);
}
Path path = new Path(partitionPath,
FSUtils.makeDataFileName(commitTime, TaskContext.getPartitionId(), fileId));
@@ -150,7 +143,8 @@ public class HoodieAppendHandle<T extends HoodieRecordPayload> extends HoodieIOH
}
writeStatus.markSuccess(hoodieRecord, recordMetadata);
// deflate record payload after recording success. This will help users access payload as a part of marking
// deflate record payload after recording success. This will help users access payload as a
// part of marking
// record successful.
hoodieRecord.deflate();
return avroRecord;
@@ -165,7 +159,8 @@ public class HoodieAppendHandle<T extends HoodieRecordPayload> extends HoodieIOH
// to make sure we don't append records with older (shorter) schema than already appended
public void doAppend() {
int maxBlockSize = config.getLogFileDataBlockMaxSize(); int numberOfRecords = 0;
int maxBlockSize = config.getLogFileDataBlockMaxSize();
int numberOfRecords = 0;
Map<HoodieLogBlock.HeaderMetadataType, String> header = Maps.newHashMap();
header.put(HoodieLogBlock.HeaderMetadataType.INSTANT_TIME, commitTime);
header.put(HoodieLogBlock.HeaderMetadataType.SCHEMA, schema.toString());
@@ -180,7 +175,8 @@ public class HoodieAppendHandle<T extends HoodieRecordPayload> extends HoodieIOH
}
// Append if max number of records reached to achieve block size
if (numberOfRecords >= (int) (maxBlockSize / averageRecordSize)) {
// Recompute averageRecordSize before writing a new block and update existing value with avg of new and old
// Recompute averageRecordSize before writing a new block and update existing value with
// avg of new and old
logger.info("AvgRecordSize => " + averageRecordSize);
averageRecordSize = (averageRecordSize + SizeEstimator.estimate(record)) / 2;
doAppend(header);
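The append path above buffers records and flushes a log block once the buffered count reaches roughly maxBlockSize / averageRecordSize, re-estimating the average record size as a running mean of the old estimate and the latest record. A toy sketch of that heuristic, where the 1 KB block budget and per-record sizes are made-up numbers and SizeEstimator is replaced by a plain string length:

import java.util.ArrayList;
import java.util.List;

public class AppendBlockSizingSketch {

  public static void main(String[] args) {
    long maxBlockSize = 1024;      // hypothetical data block budget in bytes
    long averageRecordSize = 100;  // initial estimate, refined as records flow through
    List<String> buffer = new ArrayList<>();
    int blocksWritten = 0;

    for (int i = 0; i < 50; i++) {
      String record = "record-" + i;
      buffer.add(record);

      // Flush once the buffered record count would exceed the current block budget.
      if (buffer.size() >= (int) (maxBlockSize / averageRecordSize)) {
        // Re-estimate the average as the mean of the old estimate and the latest record size,
        // mirroring the (old + estimate(record)) / 2 update in HoodieAppendHandle.
        averageRecordSize = (averageRecordSize + record.length()) / 2;
        blocksWritten++;
        buffer.clear();
      }
    }
    System.out.println("blocks written: " + blocksWritten
        + ", final averageRecordSize estimate: " + averageRecordSize);
  }
}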

View File

@@ -68,8 +68,7 @@ public class HoodieCleanHelper<T extends HoodieRecordPayload<T>> {
throws IOException {
logger.info("Cleaning " + partitionPath + ", retaining latest " + config
.getCleanerFileVersionsRetained() + " file versions. ");
List<HoodieFileGroup> fileGroups =
fileSystemView.getAllFileGroups(partitionPath)
List<HoodieFileGroup> fileGroups = fileSystemView.getAllFileGroups(partitionPath)
.collect(Collectors.toList());
List<String> deletePaths = new ArrayList<>();
// Collect all the datafiles savepointed by all the savepoints
@@ -94,11 +93,9 @@ public class HoodieCleanHelper<T extends HoodieRecordPayload<T>> {
FileSlice nextSlice = fileSliceIterator.next();
HoodieDataFile dataFile = nextSlice.getDataFile().get();
deletePaths.add(dataFile.getFileStatus().getPath().toString());
if (hoodieTable.getMetaClient().getTableType()
== HoodieTableType.MERGE_ON_READ) {
if (hoodieTable.getMetaClient().getTableType() == HoodieTableType.MERGE_ON_READ) {
// If merge on read, then clean the log files for the commits as well
deletePaths.addAll(nextSlice.getLogFiles()
.map(file -> file.getPath().toString())
deletePaths.addAll(nextSlice.getLogFiles().map(file -> file.getPath().toString())
.collect(Collectors.toList()));
}
}
@@ -121,8 +118,8 @@ public class HoodieCleanHelper<T extends HoodieRecordPayload<T>> {
private List<String> getFilesToCleanKeepingLatestCommits(String partitionPath)
throws IOException {
int commitsRetained = config.getCleanerCommitsRetained();
logger.info(
"Cleaning " + partitionPath + ", retaining latest " + commitsRetained + " commits. ");
logger
.info("Cleaning " + partitionPath + ", retaining latest " + commitsRetained + " commits. ");
List<String> deletePaths = new ArrayList<>();
// Collect all the datafiles savepointed by all the savepoints
@@ -132,15 +129,14 @@ public class HoodieCleanHelper<T extends HoodieRecordPayload<T>> {
// determine if we have enough commits, to start cleaning.
if (commitTimeline.countInstants() > commitsRetained) {
HoodieInstant earliestCommitToRetain = getEarliestCommitToRetain().get();
List<HoodieFileGroup> fileGroups =
fileSystemView.getAllFileGroups(partitionPath)
List<HoodieFileGroup> fileGroups = fileSystemView.getAllFileGroups(partitionPath)
.collect(Collectors.toList());
for (HoodieFileGroup fileGroup : fileGroups) {
List<FileSlice> fileSliceList = fileGroup.getAllFileSlices().collect(Collectors.toList());
HoodieDataFile dataFile = fileSliceList.get(0).getDataFile().get();
String lastVersion = dataFile.getCommitTime();
String lastVersionBeforeEarliestCommitToRetain =
getLatestVersionBeforeCommit(fileSliceList, earliestCommitToRetain);
String lastVersionBeforeEarliestCommitToRetain = getLatestVersionBeforeCommit(fileSliceList,
earliestCommitToRetain);
// Ensure there are more than 1 version of the file (we only clean old files from updates)
// i.e always spare the last commit.
@@ -151,28 +147,26 @@ public class HoodieCleanHelper<T extends HoodieRecordPayload<T>> {
// do not clean up a savepoint data file
continue;
}
// Dont delete the latest commit and also the last commit before the earliest commit we are retaining
// The window of commit retain == max query run time. So a query could be running which still
// Don't delete the latest commit and also the last commit before the earliest commit we
// are retaining
// The window of commit retain == max query run time. So a query could be running which
// still
// uses this file.
if (fileCommitTime.equals(lastVersion) || (
lastVersionBeforeEarliestCommitToRetain != null && fileCommitTime
.equals(lastVersionBeforeEarliestCommitToRetain))) {
if (fileCommitTime.equals(lastVersion) || (lastVersionBeforeEarliestCommitToRetain != null
&& fileCommitTime.equals(lastVersionBeforeEarliestCommitToRetain))) {
// move on to the next file
continue;
}
// Always keep the last commit
if (HoodieTimeline.compareTimestamps(
earliestCommitToRetain.getTimestamp(),
fileCommitTime,
if (HoodieTimeline
.compareTimestamps(earliestCommitToRetain.getTimestamp(), fileCommitTime,
HoodieTimeline.GREATER)) {
// this is a commit, that should be cleaned.
deletePaths.add(aFile.getFileStatus().getPath().toString());
if (hoodieTable.getMetaClient().getTableType()
== HoodieTableType.MERGE_ON_READ) {
if (hoodieTable.getMetaClient().getTableType() == HoodieTableType.MERGE_ON_READ) {
// If merge on read, then clean the log files for the commits as well
deletePaths.addAll(aSlice.getLogFiles()
.map(file -> file.getPath().toString())
deletePaths.addAll(aSlice.getLogFiles().map(file -> file.getPath().toString())
.collect(Collectors.toList()));
}
}
@@ -190,9 +184,10 @@ public class HoodieCleanHelper<T extends HoodieRecordPayload<T>> {
HoodieInstant commitTime) {
for (FileSlice file : fileSliceList) {
String fileCommitTime = file.getDataFile().get().getCommitTime();
if (HoodieTimeline.compareTimestamps(commitTime.getTimestamp(), fileCommitTime,
HoodieTimeline.GREATER)) {
// fileList is sorted on the reverse, so the first commit we find <= commitTime is the one we want
if (HoodieTimeline
.compareTimestamps(commitTime.getTimestamp(), fileCommitTime, HoodieTimeline.GREATER)) {
// fileList is sorted on the reverse, so the first commit we find <= commitTime is the
// one we want
return fileCommitTime;
}
}
@@ -213,8 +208,7 @@ public class HoodieCleanHelper<T extends HoodieRecordPayload<T>> {
} else {
throw new IllegalArgumentException("Unknown cleaning policy : " + policy.name());
}
logger.info(
deletePaths.size() + " patterns used to delete in partition path:" + partitionPath);
logger.info(deletePaths.size() + " patterns used to delete in partition path:" + partitionPath);
return deletePaths;
}
@@ -227,8 +221,8 @@ public class HoodieCleanHelper<T extends HoodieRecordPayload<T>> {
int commitsRetained = config.getCleanerCommitsRetained();
if (config.getCleanerPolicy() == HoodieCleaningPolicy.KEEP_LATEST_COMMITS
&& commitTimeline.countInstants() > commitsRetained) {
earliestCommitToRetain =
commitTimeline.nthInstant(commitTimeline.countInstants() - commitsRetained);
earliestCommitToRetain = commitTimeline
.nthInstant(commitTimeline.countInstants() - commitsRetained);
}
return earliestCommitToRetain;
}
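Both cleaning policies above come down to walking each file group's slices from newest to oldest and marking everything beyond the retention window for deletion. A simplified sketch of the KEEP_LATEST_FILE_VERSIONS flavor, using plain lists of commit times per file group instead of the real FileSlice objects:

import java.util.ArrayList;
import java.util.Arrays;
import java.util.Comparator;
import java.util.List;

public class KeepLatestVersionsCleanerSketch {

  /** Return the commit times whose files should be deleted, keeping the newest N versions. */
  static List<String> versionsToClean(List<String> versionCommitTimes, int versionsRetained) {
    List<String> sorted = new ArrayList<>(versionCommitTimes);
    // Newest first, matching how file slices are iterated in HoodieCleanHelper.
    sorted.sort(Comparator.reverseOrder());
    if (sorted.size() <= versionsRetained) {
      return new ArrayList<>();
    }
    return sorted.subList(versionsRetained, sorted.size());
  }

  public static void main(String[] args) {
    // One file group with four versions written by four commits.
    List<String> versions = Arrays.asList("20180317", "20180318", "20180319", "20180320");
    // Retain the latest 2 versions; the two older ones become delete candidates.
    System.out.println(versionsToClean(versions, 2)); // [20180318, 20180317]
  }
}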

View File

@@ -40,13 +40,6 @@ import com.uber.hoodie.exception.HoodieCommitException;
import com.uber.hoodie.exception.HoodieException;
import com.uber.hoodie.exception.HoodieIOException;
import com.uber.hoodie.table.HoodieTable;
import org.apache.avro.Schema;
import org.apache.avro.file.DataFileStream;
import org.apache.avro.generic.IndexedRecord;
import org.apache.hadoop.fs.Path;
import org.apache.log4j.LogManager;
import org.apache.log4j.Logger;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
@@ -54,6 +47,11 @@ import java.util.Map;
import java.util.Optional;
import java.util.stream.Collectors;
import java.util.stream.Stream;
import org.apache.avro.Schema;
import org.apache.avro.generic.IndexedRecord;
import org.apache.hadoop.fs.Path;
import org.apache.log4j.LogManager;
import org.apache.log4j.Logger;
/**
* Archiver to bound the growth of <action>.commit files
@@ -76,11 +74,9 @@ public class HoodieCommitArchiveLog {
private HoodieLogFormat.Writer openWriter() {
try {
if (this.writer == null) {
return HoodieLogFormat.newWriterBuilder()
.onParentPath(archiveFilePath.getParent())
return HoodieLogFormat.newWriterBuilder().onParentPath(archiveFilePath.getParent())
.withFileId(archiveFilePath.getName())
.withFileExtension(HoodieArchivedLogFile.ARCHIVE_EXTENSION)
.withFs(metaClient.getFs())
.withFileExtension(HoodieArchivedLogFile.ARCHIVE_EXTENSION).withFs(metaClient.getFs())
.overBaseCommit("").build();
} else {
return this.writer;
@@ -136,21 +132,19 @@ public class HoodieCommitArchiveLog {
.getTimelineOfActions(Sets.newHashSet(HoodieTimeline.CLEAN_ACTION))
.filterCompletedInstants();
Stream<HoodieInstant> instants = cleanAndRollbackTimeline.getInstants()
.collect(Collectors.groupingBy(s -> s.getAction()))
.entrySet()
.stream()
.map(i -> {
.collect(Collectors.groupingBy(s -> s.getAction())).entrySet().stream().map(i -> {
if (i.getValue().size() > maxCommitsToKeep) {
return i.getValue().subList(0, i.getValue().size() - minCommitsToKeep);
} else {
return new ArrayList<HoodieInstant>();
}
})
.flatMap(i -> i.stream());
}).flatMap(i -> i.stream());
//TODO (na) : Add a way to return actions associated with a timeline and then merge/unify with logic above to avoid Stream.concats
//TODO (na) : Add a way to return actions associated with a timeline and then merge/unify
// with logic above to avoid Stream.concats
HoodieTimeline commitTimeline = table.getCompletedCommitTimeline();
// We cannot have any holes in the commit timeline. We cannot archive any commits which are made after the first savepoint present.
// We cannot have any holes in the commit timeline. We cannot archive any commits which are
// made after the first savepoint present.
Optional<HoodieInstant> firstSavepoint = table.getCompletedSavepointTimeline().firstInstant();
if (!commitTimeline.empty() && commitTimeline.countInstants() > maxCommitsToKeep) {
// Actually do the commits
@@ -169,16 +163,14 @@ public class HoodieCommitArchiveLog {
log.info("Deleting instants " + archivedInstants);
boolean success = true;
for (HoodieInstant archivedInstant : archivedInstants) {
Path commitFile =
new Path(metaClient.getMetaPath(), archivedInstant.getFileName());
Path commitFile = new Path(metaClient.getMetaPath(), archivedInstant.getFileName());
try {
if (metaClient.getFs().exists(commitFile)) {
success &= metaClient.getFs().delete(commitFile, false);
log.info("Archived and deleted instant file " + commitFile);
}
} catch (IOException e) {
throw new HoodieIOException("Failed to delete archived instant " + archivedInstant,
e);
throw new HoodieIOException("Failed to delete archived instant " + archivedInstant, e);
}
}
return success;
@@ -186,8 +178,8 @@ public class HoodieCommitArchiveLog {
public void archive(List<HoodieInstant> instants) throws HoodieCommitException {
try {
HoodieTimeline commitTimeline =
metaClient.getActiveTimeline().getAllCommitsTimeline().filterCompletedInstants();
HoodieTimeline commitTimeline = metaClient.getActiveTimeline().getAllCommitsTimeline()
.filterCompletedInstants();
Schema wrapperSchema = HoodieArchivedMetaEntry.getClassSchema();
log.info("Wrapper schema " + wrapperSchema.toString());
List<IndexedRecord> records = new ArrayList<>();
@@ -247,6 +239,8 @@ public class HoodieCommitArchiveLog {
archivedMetaWrapper.setActionType(ActionType.commit.name());
break;
}
default:
throw new UnsupportedOperationException("Action not fully supported yet");
}
return archivedMetaWrapper;
}
@@ -256,9 +250,8 @@ public class HoodieCommitArchiveLog {
ObjectMapper mapper = new ObjectMapper();
//Need this to ignore other public get() methods
mapper.configure(DeserializationFeature.FAIL_ON_UNKNOWN_PROPERTIES, false);
com.uber.hoodie.avro.model.HoodieCommitMetadata avroMetaData =
mapper.convertValue(hoodieCommitMetadata,
com.uber.hoodie.avro.model.HoodieCommitMetadata.class);
com.uber.hoodie.avro.model.HoodieCommitMetadata avroMetaData = mapper
.convertValue(hoodieCommitMetadata, com.uber.hoodie.avro.model.HoodieCommitMetadata.class);
return avroMetaData;
}
}
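The archiving logic keeps the timeline bounded: once the number of completed instants exceeds maxCommitsToKeep, everything except the newest minCommitsToKeep instants becomes eligible for archival (with the additional guard, noted above, that nothing after the first savepoint is archived). A small sketch of just the window computation over plain timestamp strings:

import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;

public class ArchiveWindowSketch {

  /** Instants eligible for archiving, given an ascending list of completed commit times. */
  static List<String> instantsToArchive(List<String> commits, int minToKeep, int maxToKeep) {
    if (commits.size() <= maxToKeep) {
      // Timeline is still small enough; archive nothing.
      return new ArrayList<>();
    }
    // Archive the oldest commits, leaving the newest minToKeep on the active timeline.
    return new ArrayList<>(commits.subList(0, commits.size() - minToKeep));
  }

  public static void main(String[] args) {
    List<String> commits = Arrays.asList("c01", "c02", "c03", "c04", "c05", "c06", "c07");
    // With maxCommitsToKeep=5 and minCommitsToKeep=3, the 4 oldest commits get archived.
    System.out.println(instantsToArchive(commits, 3, 5)); // [c01, c02, c03, c04]
  }
}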

View File

@@ -49,8 +49,8 @@ public class HoodieCreateHandle<T extends HoodieRecordPayload> extends HoodieIOH
private long recordsWritten = 0;
private long recordsDeleted = 0;
public HoodieCreateHandle(HoodieWriteConfig config, String commitTime,
HoodieTable<T> hoodieTable, String partitionPath) {
public HoodieCreateHandle(HoodieWriteConfig config, String commitTime, HoodieTable<T> hoodieTable,
String partitionPath) {
super(config, commitTime, hoodieTable);
this.status = ReflectionUtils.loadClass(config.getWriteStatusClassName());
status.setFileId(UUID.randomUUID().toString());
@@ -64,13 +64,10 @@ public class HoodieCreateHandle<T extends HoodieRecordPayload> extends HoodieIOH
}
try {
HoodiePartitionMetadata partitionMetadata = new HoodiePartitionMetadata(fs,
commitTime,
new Path(config.getBasePath()),
new Path(config.getBasePath(), partitionPath));
HoodiePartitionMetadata partitionMetadata = new HoodiePartitionMetadata(fs, commitTime,
new Path(config.getBasePath()), new Path(config.getBasePath(), partitionPath));
partitionMetadata.trySave(TaskContext.getPartitionId());
this.storageWriter =
HoodieStorageWriterFactory
this.storageWriter = HoodieStorageWriterFactory
.getStorageWriter(commitTime, getStorageWriterPath(), hoodieTable, config, schema);
} catch (IOException e) {
throw new HoodieInsertException(
@@ -81,13 +78,12 @@ public class HoodieCreateHandle<T extends HoodieRecordPayload> extends HoodieIOH
/**
* Determines whether we can accept the incoming records, into the current file, depending on
*
* <p>
* - Whether it belongs to the same partitionPath as existing records - Whether the current file
* written bytes are less than the max file size
*/
public boolean canWrite(HoodieRecord record) {
return storageWriter.canWrite() && record.getPartitionPath()
.equals(status.getPartitionPath());
return storageWriter.canWrite() && record.getPartitionPath().equals(status.getPartitionPath());
}
/**
@@ -111,7 +107,8 @@ public class HoodieCreateHandle<T extends HoodieRecordPayload> extends HoodieIOH
recordsDeleted++;
}
status.markSuccess(record, recordMetadata);
// deflate record payload after recording success. This will help users access payload as a part of marking
// deflate record payload after recording success. This will help users access payload as a
// part of marking
// record successful.
record.deflate();
} catch (Throwable t) {
@@ -126,8 +123,7 @@ public class HoodieCreateHandle<T extends HoodieRecordPayload> extends HoodieIOH
* Performs actions to durably persist the current changes and returns a WriteStatus object
*/
public WriteStatus close() {
logger.info(
"Closing the file " + status.getFileId() + " as we are done with all the records "
logger.info("Closing the file " + status.getFileId() + " as we are done with all the records "
+ recordsWritten);
try {
storageWriter.close();
@@ -144,8 +140,7 @@ public class HoodieCreateHandle<T extends HoodieRecordPayload> extends HoodieIOH
return status;
} catch (IOException e) {
throw new HoodieInsertException("Failed to close the Insert Handle for path " + path,
e);
throw new HoodieInsertException("Failed to close the Insert Handle for path " + path, e);
}
}

View File

@@ -39,11 +39,10 @@ public abstract class HoodieIOHandle<T extends HoodieRecordPayload> {
protected final HoodieWriteConfig config;
protected final FileSystem fs;
protected final HoodieTable<T> hoodieTable;
protected HoodieTimeline hoodieTimeline;
protected final Schema schema;
protected HoodieTimeline hoodieTimeline;
public HoodieIOHandle(HoodieWriteConfig config, String commitTime,
HoodieTable<T> hoodieTable) {
public HoodieIOHandle(HoodieWriteConfig config, String commitTime, HoodieTable<T> hoodieTable) {
this.commitTime = commitTime;
this.config = config;
this.fs = hoodieTable.getMetaClient().getFs();
@@ -52,6 +51,32 @@ public abstract class HoodieIOHandle<T extends HoodieRecordPayload> {
this.schema = createHoodieWriteSchema(config);
}
/**
* Deletes any new tmp files written during the current commit into the partition
*/
public static void cleanupTmpFilesFromCurrentCommit(HoodieWriteConfig config, String commitTime,
String partitionPath, int taskPartitionId, HoodieTable hoodieTable) {
FileSystem fs = hoodieTable.getMetaClient().getFs();
try {
FileStatus[] prevFailedFiles = fs.globStatus(new Path(String
.format("%s/%s/%s", config.getBasePath(), partitionPath,
FSUtils.maskWithoutFileId(commitTime, taskPartitionId))));
if (prevFailedFiles != null) {
logger.info(
"Deleting " + prevFailedFiles.length + " files generated by previous failed attempts.");
for (FileStatus status : prevFailedFiles) {
fs.delete(status.getPath(), false);
}
}
} catch (IOException e) {
throw new HoodieIOException("Failed to cleanup Temp files from commit " + commitTime, e);
}
}
public static Schema createHoodieWriteSchema(HoodieWriteConfig config) {
return HoodieAvroUtils.addMetadataFields(new Schema.Parser().parse(config.getSchema()));
}
public Path makeNewPath(String partitionPath, int taskPartitionId, String fileName) {
Path path = new Path(config.getBasePath(), partitionPath);
try {
@@ -72,37 +97,7 @@ public abstract class HoodieIOHandle<T extends HoodieRecordPayload> {
taskAttemptId));
}
/**
* Deletes any new tmp files written during the current commit, into the partition
*/
public static void cleanupTmpFilesFromCurrentCommit(HoodieWriteConfig config,
String commitTime,
String partitionPath,
int taskPartitionId,
HoodieTable hoodieTable) {
FileSystem fs = hoodieTable.getMetaClient().getFs();
try {
FileStatus[] prevFailedFiles = fs.globStatus(new Path(String
.format("%s/%s/%s", config.getBasePath(), partitionPath,
FSUtils.maskWithoutFileId(commitTime, taskPartitionId))));
if (prevFailedFiles != null) {
logger.info("Deleting " + prevFailedFiles.length
+ " files generated by previous failed attempts.");
for (FileStatus status : prevFailedFiles) {
fs.delete(status.getPath(), false);
}
}
} catch (IOException e) {
throw new HoodieIOException("Failed to cleanup Temp files from commit " + commitTime,
e);
}
}
public Schema getSchema() {
return schema;
}
public static Schema createHoodieWriteSchema(HoodieWriteConfig config) {
return HoodieAvroUtils.addMetadataFields(new Schema.Parser().parse(config.getSchema()));
}
}

View File

@@ -26,14 +26,18 @@ import com.uber.hoodie.common.table.TableFileSystemView;
import com.uber.hoodie.common.util.FSUtils;
import com.uber.hoodie.common.util.ReflectionUtils;
import com.uber.hoodie.common.util.collection.ExternalSpillableMap;
import com.uber.hoodie.common.util.collection.converter.StringConverter;
import com.uber.hoodie.common.util.collection.converter.HoodieRecordConverter;
import com.uber.hoodie.common.util.collection.converter.StringConverter;
import com.uber.hoodie.config.HoodieWriteConfig;
import com.uber.hoodie.exception.HoodieIOException;
import com.uber.hoodie.exception.HoodieUpsertException;
import com.uber.hoodie.io.storage.HoodieStorageWriter;
import com.uber.hoodie.io.storage.HoodieStorageWriterFactory;
import com.uber.hoodie.table.HoodieTable;
import java.io.IOException;
import java.util.Iterator;
import java.util.Map;
import java.util.Optional;
import org.apache.avro.generic.GenericRecord;
import org.apache.avro.generic.IndexedRecord;
import org.apache.hadoop.fs.Path;
@@ -41,11 +45,6 @@ import org.apache.log4j.LogManager;
import org.apache.log4j.Logger;
import org.apache.spark.TaskContext;
import java.io.IOException;
import java.util.Iterator;
import java.util.Map;
import java.util.Optional;
@SuppressWarnings("Duplicates")
public class HoodieMergeHandle<T extends HoodieRecordPayload> extends HoodieIOHandle<T> {
@@ -62,59 +61,46 @@ public class HoodieMergeHandle<T extends HoodieRecordPayload> extends HoodieIOHa
private long recordsDeleted = 0;
private long updatedRecordsWritten = 0;
public HoodieMergeHandle(HoodieWriteConfig config,
String commitTime,
HoodieTable<T> hoodieTable,
Iterator<HoodieRecord<T>> recordItr,
String fileId) {
public HoodieMergeHandle(HoodieWriteConfig config, String commitTime, HoodieTable<T> hoodieTable,
Iterator<HoodieRecord<T>> recordItr, String fileId) {
super(config, commitTime, hoodieTable);
this.fileSystemView = hoodieTable.getROFileSystemView();
init(fileId, init(fileId, recordItr));
}
public HoodieMergeHandle(HoodieWriteConfig config,
String commitTime,
HoodieTable<T> hoodieTable,
Map<String, HoodieRecord<T>> keyToNewRecords,
String fileId) {
public HoodieMergeHandle(HoodieWriteConfig config, String commitTime, HoodieTable<T> hoodieTable,
Map<String, HoodieRecord<T>> keyToNewRecords, String fileId) {
super(config, commitTime, hoodieTable);
this.fileSystemView = hoodieTable.getROFileSystemView();
this.keyToNewRecords = keyToNewRecords;
init(fileId, keyToNewRecords.get(keyToNewRecords.keySet().stream().findFirst().get()).getPartitionPath());
init(fileId, keyToNewRecords.get(keyToNewRecords.keySet().stream().findFirst().get())
.getPartitionPath());
}
/**
* Extract old file path, initialize StorageWriter and WriteStatus
* @param fileId
* @param partitionPath
*/
private void init(String fileId, String partitionPath) {
WriteStatus writeStatus = ReflectionUtils.loadClass(config.getWriteStatusClassName());
writeStatus.setStat(new HoodieWriteStat());
this.writeStatus = writeStatus;
try {
String latestValidFilePath = fileSystemView
.getLatestDataFiles(partitionPath)
.filter(dataFile -> dataFile.getFileId().equals(fileId))
.findFirst()
.get().getFileName();
String latestValidFilePath = fileSystemView.getLatestDataFiles(partitionPath)
.filter(dataFile -> dataFile.getFileId().equals(fileId)).findFirst().get().getFileName();
writeStatus.getStat().setPrevCommit(FSUtils.getCommitTime(latestValidFilePath));
HoodiePartitionMetadata partitionMetadata = new HoodiePartitionMetadata(fs,
commitTime,
new Path(config.getBasePath()),
new Path(config.getBasePath(), partitionPath));
HoodiePartitionMetadata partitionMetadata = new HoodiePartitionMetadata(fs, commitTime,
new Path(config.getBasePath()), new Path(config.getBasePath(), partitionPath));
partitionMetadata.trySave(TaskContext.getPartitionId());
oldFilePath = new Path(
config.getBasePath() + "/" + partitionPath + "/"
+ latestValidFilePath);
config.getBasePath() + "/" + partitionPath + "/" + latestValidFilePath);
String relativePath = new Path(partitionPath + "/" + FSUtils
.makeDataFileName(commitTime, TaskContext.getPartitionId(), fileId)).toString();
newFilePath = new Path(config.getBasePath(), relativePath);
if (config.shouldUseTempFolderForCopyOnWriteForMerge()) {
this.tempPath = makeTempPath(partitionPath, TaskContext.getPartitionId(),
fileId, TaskContext.get().stageId(), TaskContext.get().taskAttemptId());
this.tempPath = makeTempPath(partitionPath, TaskContext.getPartitionId(), fileId,
TaskContext.get().stageId(), TaskContext.get().taskAttemptId());
}
// handle cases of partial failures, for update task
@@ -122,8 +108,9 @@ public class HoodieMergeHandle<T extends HoodieRecordPayload> extends HoodieIOHa
fs.delete(newFilePath, false);
}
logger.info(String.format("Merging new data into oldPath %s, as newPath %s",
oldFilePath.toString(), getStorageWriterPath().toString()));
logger.info(String
.format("Merging new data into oldPath %s, as newPath %s", oldFilePath.toString(),
getStorageWriterPath().toString()));
// file name is same for all records, in this bunch
writeStatus.setFileId(fileId);
writeStatus.setPartitionPath(partitionPath);
@@ -143,9 +130,6 @@ public class HoodieMergeHandle<T extends HoodieRecordPayload> extends HoodieIOHa
/**
* Load the new incoming records in a map and return partitionPath
* @param fileId
* @param newRecordsItr
* @return
*/
private String init(String fileId, Iterator<HoodieRecord<T>> newRecordsItr) {
try {
@@ -164,14 +148,14 @@ public class HoodieMergeHandle<T extends HoodieRecordPayload> extends HoodieIOHa
// update the new location of the record, so we know where to find it next
record.setNewLocation(new HoodieRecordLocation(commitTime, fileId));
}
logger.debug("Number of entries in MemoryBasedMap => " +
((ExternalSpillableMap) keyToNewRecords).getInMemoryMapNumEntries()
+ "Total size in bytes of MemoryBasedMap => " +
((ExternalSpillableMap) keyToNewRecords).getCurrentInMemoryMapSize()
+ "Number of entries in DiskBasedMap => " +
((ExternalSpillableMap) keyToNewRecords).getDiskBasedMapNumEntries()
+ "Size of file spilled to disk => " +
((ExternalSpillableMap) keyToNewRecords).getSizeOfFileOnDiskInBytes());
logger.debug("Number of entries in MemoryBasedMap => "
+ ((ExternalSpillableMap) keyToNewRecords).getInMemoryMapNumEntries()
+ "Total size in bytes of MemoryBasedMap => "
+ ((ExternalSpillableMap) keyToNewRecords).getCurrentInMemoryMapSize()
+ "Number of entries in DiskBasedMap => "
+ ((ExternalSpillableMap) keyToNewRecords).getDiskBasedMapNumEntries()
+ "Size of file spilled to disk => "
+ ((ExternalSpillableMap) keyToNewRecords).getSizeOfFileOnDiskInBytes());
return partitionPath;
}
@@ -189,7 +173,8 @@ public class HoodieMergeHandle<T extends HoodieRecordPayload> extends HoodieIOHa
}
writeStatus.markSuccess(hoodieRecord, recordMetadata);
// deflate record payload after recording success. This will help users access payload as a part of marking
// deflate record payload after recording success. This will help users access payload as a
// part of marking
// record successful.
hoodieRecord.deflate();
return true;
@@ -201,8 +186,7 @@ public class HoodieMergeHandle<T extends HoodieRecordPayload> extends HoodieIOHa
}
/**
* Go through an old record. Here if we detect a newer version shows up, we write the new one to
* the file.
* Go through an old record. Here, if a newer version of it shows up, we write the new one to the file.
*/
public void write(GenericRecord oldRecord) {
String key = oldRecord.get(HoodieRecord.RECORD_KEY_METADATA_FIELD).toString();
@@ -236,8 +220,7 @@ public class HoodieMergeHandle<T extends HoodieRecordPayload> extends HoodieIOHa
try {
storageWriter.writeAvro(key, oldRecord);
} catch (ClassCastException e) {
logger.error(
"Schema mismatch when rewriting old record " + oldRecord + " from file "
logger.error("Schema mismatch when rewriting old record " + oldRecord + " from file "
+ getOldFilePath() + " to file " + getStorageWriterPath() + " with schema " + schema
.toString(true));
throw new HoodieUpsertException(errMsg, e);
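The merge handle above rewrites an existing file by streaming through its old records and, whenever the incoming map holds a newer version of the same key, writing the updated record instead; leftovers in the map are appended as inserts. A stripped-down sketch of that key-by-key merge, with strings standing in for avro records and a trivial "newer wins" combine (the real handle delegates combining to the record payload):

import java.util.ArrayList;
import java.util.Arrays;
import java.util.HashMap;
import java.util.List;
import java.util.Map;

public class MergeHandleSketch {

  public static void main(String[] args) {
    // Records already stored in the file being rewritten: {key, value}.
    List<String[]> oldRecords = Arrays.asList(
        new String[]{"key-1", "v1"},
        new String[]{"key-2", "v1"},
        new String[]{"key-3", "v1"});

    // Incoming updates, keyed by record key (the role of keyToNewRecords).
    Map<String, String> incoming = new HashMap<>();
    incoming.put("key-2", "v2");
    incoming.put("key-4", "v1"); // an insert routed to this file

    List<String> newFile = new ArrayList<>();

    // Pass 1: walk old records; a newer incoming version wins, otherwise copy the old record over.
    for (String[] old : oldRecords) {
      String key = old[0];
      if (incoming.containsKey(key)) {
        newFile.add(key + "=" + incoming.remove(key));
      } else {
        newFile.add(key + "=" + old[1]);
      }
    }
    // Pass 2: whatever is left in the incoming map never matched an old record; append it.
    incoming.forEach((key, value) -> newFile.add(key + "=" + value));

    System.out.println(newFile); // [key-1=v1, key-2=v2, key-3=v1, key-4=v1]
  }
}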

View File

@@ -53,8 +53,8 @@ public class CompactionOperation implements Serializable {
this.partitionPath = partitionPath;
this.dataFileCommitTime = dataFile.getCommitTime();
this.dataFileSize = dataFile.getFileSize();
this.deltaFilePaths = logFiles.stream().map(s -> s.getPath().toString()).collect(
Collectors.toList());
this.deltaFilePaths = logFiles.stream().map(s -> s.getPath().toString())
.collect(Collectors.toList());
this.metrics = writeConfig.getCompactionStrategy()
.captureMetrics(dataFile, partitionPath, logFiles);
}

View File

@@ -17,17 +17,15 @@
package com.uber.hoodie.io.compact;
import com.uber.hoodie.WriteStatus;
import com.uber.hoodie.common.model.HoodieCommitMetadata;
import com.uber.hoodie.common.table.HoodieTimeline;
import com.uber.hoodie.common.table.timeline.HoodieActiveTimeline;
import com.uber.hoodie.common.table.timeline.HoodieInstant;
import com.uber.hoodie.config.HoodieWriteConfig;
import com.uber.hoodie.table.HoodieTable;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import java.io.Serializable;
import java.util.Date;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
/**
* A HoodieCompactor runs compaction on a hoodie table

View File

@@ -17,6 +17,7 @@
package com.uber.hoodie.io.compact;
import static java.util.stream.Collectors.toList;
import com.google.common.base.Preconditions;
import com.google.common.collect.Lists;
import com.google.common.collect.Sets;
@@ -70,9 +71,8 @@ public class HoodieRealtimeTableCompactor implements HoodieCompactor {
}
private JavaRDD<WriteStatus> executeCompaction(JavaSparkContext jsc,
List<CompactionOperation> operations,
HoodieTable hoodieTable,
HoodieWriteConfig config, String compactionCommitTime) throws IOException {
List<CompactionOperation> operations, HoodieTable hoodieTable, HoodieWriteConfig config,
String compactionCommitTime) throws IOException {
log.info("After filtering, Compacting " + operations + " files");
return jsc.parallelize(operations, operations.size())
@@ -80,18 +80,19 @@ public class HoodieRealtimeTableCompactor implements HoodieCompactor {
.flatMap(writeStatusesItr -> writeStatusesItr.iterator());
}
private List<WriteStatus> compact(HoodieTable hoodieTable,
HoodieWriteConfig config, CompactionOperation operation, String commitTime)
throws IOException {
private List<WriteStatus> compact(HoodieTable hoodieTable, HoodieWriteConfig config,
CompactionOperation operation, String commitTime) throws IOException {
FileSystem fs = hoodieTable.getMetaClient().getFs();
Schema readerSchema =
HoodieAvroUtils.addMetadataFields(new Schema.Parser().parse(config.getSchema()));
Schema readerSchema = HoodieAvroUtils
.addMetadataFields(new Schema.Parser().parse(config.getSchema()));
log.info("Compacting base " + operation.getDataFilePath() + " with delta files " + operation
.getDeltaFilePaths() + " for commit " + commitTime);
// TODO - FIX THIS
// Reads the entire avro file. Always only specific blocks should be read from the avro file (failure recover).
// Load all the delta commits since the last compaction commit and get all the blocks to be loaded and load it using CompositeAvroLogReader
// Reads the entire avro file. Always only specific blocks should be read from the avro file
// (failure recovery).
// Load all the delta commits since the last compaction commit and get all the blocks to be
// loaded and load it using CompositeAvroLogReader
// Since a DeltaCommit is not defined yet, reading all the records. revisit this soon.
HoodieTableMetaClient metaClient = hoodieTable.getMetaClient();
String maxInstantTime = metaClient.getActiveTimeline()
@@ -114,25 +115,22 @@ public class HoodieRealtimeTableCompactor implements HoodieCompactor {
Iterator<List<WriteStatus>> result = table
.handleUpdate(commitTime, operation.getFileId(), scanner.getRecords());
Iterable<List<WriteStatus>> resultIterable = () -> result;
return StreamSupport.stream(resultIterable.spliterator(), false)
.flatMap(Collection::stream)
return StreamSupport.stream(resultIterable.spliterator(), false).flatMap(Collection::stream)
.map(s -> {
s.getStat().setTotalRecordsToBeUpdate(scanner.getTotalRecordsToUpdate());
s.getStat().setTotalLogFiles(scanner.getTotalLogFiles());
s.getStat().setTotalLogRecords(scanner.getTotalLogRecords());
s.getStat().setPartitionPath(operation.getPartitionPath());
return s;
})
.collect(toList());
}).collect(toList());
}
private List<CompactionOperation> getCompactionWorkload(JavaSparkContext jsc,
HoodieTable hoodieTable,
HoodieWriteConfig config, String compactionCommitTime)
HoodieTable hoodieTable, HoodieWriteConfig config, String compactionCommitTime)
throws IOException {
Preconditions.checkArgument(
hoodieTable.getMetaClient().getTableType() == HoodieTableType.MERGE_ON_READ,
Preconditions
.checkArgument(hoodieTable.getMetaClient().getTableType() == HoodieTableType.MERGE_ON_READ,
"HoodieRealtimeTableCompactor can only compact table of type "
+ HoodieTableType.MERGE_ON_READ + " and not " + hoodieTable.getMetaClient()
.getTableType().name());
@@ -141,25 +139,23 @@ public class HoodieRealtimeTableCompactor implements HoodieCompactor {
// TODO - rollback any compactions in flight
HoodieTableMetaClient metaClient = hoodieTable.getMetaClient();
log.info("Compacting " + metaClient.getBasePath() + " with commit " + compactionCommitTime);
List<String> partitionPaths =
FSUtils.getAllPartitionPaths(metaClient.getFs(), metaClient.getBasePath(),
List<String> partitionPaths = FSUtils
.getAllPartitionPaths(metaClient.getFs(), metaClient.getBasePath(),
config.shouldAssumeDatePartitioning());
TableFileSystemView.RealtimeView fileSystemView = hoodieTable.getRTFileSystemView();
log.info("Compaction looking for files to compact in " + partitionPaths + " partitions");
List<CompactionOperation> operations =
jsc.parallelize(partitionPaths, partitionPaths.size())
List<CompactionOperation> operations = jsc.parallelize(partitionPaths, partitionPaths.size())
.flatMap((FlatMapFunction<String, CompactionOperation>) partitionPath -> fileSystemView
.getLatestFileSlices(partitionPath)
.map(s -> new CompactionOperation(s.getDataFile().get(),
partitionPath,
.getLatestFileSlices(partitionPath).map(
s -> new CompactionOperation(s.getDataFile().get(), partitionPath,
s.getLogFiles().sorted(HoodieLogFile.getLogVersionComparator().reversed())
.collect(Collectors.toList()), config))
.filter(c -> !c.getDeltaFilePaths().isEmpty())
.collect(toList()).iterator()).collect();
.filter(c -> !c.getDeltaFilePaths().isEmpty()).collect(toList()).iterator()).collect();
log.info("Total of " + operations.size() + " compactions are retrieved");
// Filter the compactions with the passed in filter. This lets us choose most effective compactions only
// Filter the compactions with the passed in filter. This lets us choose most effective
// compactions only
operations = config.getCompactionStrategy().orderAndFilter(config, operations);
if (operations.isEmpty()) {
log.warn("After filtering, Nothing to compact for " + metaClient.getBasePath());

View File

@@ -44,9 +44,9 @@ public class BoundedIOCompactionStrategy implements CompactionStrategy {
List<HoodieLogFile> logFiles) {
Map<String, Object> metrics = Maps.newHashMap();
// Total size of all the log files
Long totalLogFileSize = logFiles.stream().map(HoodieLogFile::getFileSize).filter(
Optional::isPresent).map(Optional::get).reduce(
(size1, size2) -> size1 + size2).orElse(0L);
Long totalLogFileSize = logFiles.stream().map(HoodieLogFile::getFileSize)
.filter(Optional::isPresent).map(Optional::get).reduce((size1, size2) -> size1 + size2)
.orElse(0L);
// Total read will be the base file + all the log files
Long totalIORead = FSUtils.getSizeInMB(dataFile.getFileSize() + totalLogFileSize);
// Total write will be similar to the size of the base file
@@ -64,7 +64,8 @@ public class BoundedIOCompactionStrategy implements CompactionStrategy {
@Override
public List<CompactionOperation> orderAndFilter(HoodieWriteConfig writeConfig,
List<CompactionOperation> operations) {
// Iterate through the operations in order and accept operations as long as we are within the IO limit
// Iterate through the operations in order and accept operations as long as we are within the
// IO limit
// Preserves the original ordering of compactions
List<CompactionOperation> finalOperations = Lists.newArrayList();
long targetIORemaining = writeConfig.getTargetIOPerCompactionInMB();
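BoundedIOCompactionStrategy's orderAndFilter is essentially a greedy scan: walk the already ordered compaction operations and accept each one until the estimated IO of the accepted set would exceed the per-compaction budget. A minimal sketch with operations reduced to their estimated IO cost in MB (the numbers are illustrative):

import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;

public class BoundedIoSelectionSketch {

  /** Greedily keep operations, in order, while their total IO fits the budget. */
  static List<Long> filterWithinBudget(List<Long> operationIoMb, long targetIoMb) {
    List<Long> accepted = new ArrayList<>();
    long remaining = targetIoMb;
    for (long cost : operationIoMb) {
      if (cost > remaining) {
        // Budget exhausted; remaining operations wait for the next compaction run.
        break;
      }
      accepted.add(cost);
      remaining -= cost;
    }
    return accepted;
  }

  public static void main(String[] args) {
    // Estimated total IO (read base + logs, write new base) per compaction operation.
    List<Long> costs = Arrays.asList(120L, 300L, 250L, 80L);
    // With a 500 MB budget only the first two operations are picked this round.
    System.out.println(filterWithinBudget(costs, 500)); // [120, 300]
  }
}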

View File

@@ -28,7 +28,7 @@ import java.util.Map;
* Strategy for compaction. Pluggable implementation to define how compaction should be done. The
* implementations of this interface can capture the relevant metrics to order and filter the final
* list of compaction operation to run in a single compaction.
*
* <p>
* Implementations of CompactionStrategy cannot hold any state. Different instantiations can be
* passed in every time
*

View File

@@ -20,7 +20,6 @@ package com.uber.hoodie.io.compact.strategy;
import com.uber.hoodie.config.HoodieWriteConfig;
import com.uber.hoodie.exception.HoodieException;
import com.uber.hoodie.io.compact.CompactionOperation;
import java.text.ParseException;
import java.text.SimpleDateFormat;
import java.util.Comparator;
@@ -30,15 +29,16 @@ import java.util.Locale;
import java.util.stream.Collectors;
/**
* This strategy orders compactions in reverse order of creation of Hive Partitions.
* It helps to compact data in latest partitions first and then older capped at the Total_IO allowed.
* This strategy orders compactions in reverse order of creation of Hive Partitions. It helps to
* compact data in the latest partitions first, then older partitions, capped at the Total_IO allowed.
*/
public class DayBasedCompactionStrategy extends BoundedIOCompactionStrategy {
// For now, use SimpleDateFormat as default partition format
private static String datePartitionFormat = "yyyy/MM/dd";
// Sorts compaction in LastInFirstCompacted order
private static Comparator<CompactionOperation> comparator = (CompactionOperation leftC, CompactionOperation rightC) -> {
private static Comparator<CompactionOperation> comparator = (CompactionOperation leftC,
CompactionOperation rightC) -> {
try {
Date left = new SimpleDateFormat(datePartitionFormat, Locale.ENGLISH)
.parse(leftC.getPartitionPath());
@@ -55,8 +55,10 @@ public class DayBasedCompactionStrategy extends BoundedIOCompactionStrategy {
}
@Override
public List<CompactionOperation> orderAndFilter(HoodieWriteConfig writeConfig, List<CompactionOperation> operations) {
public List<CompactionOperation> orderAndFilter(HoodieWriteConfig writeConfig,
List<CompactionOperation> operations) {
// Iterate through the operations and accept operations as long as we are within the IO limit
return super.orderAndFilter(writeConfig, operations.stream().sorted(comparator).collect(Collectors.toList()));
return super.orderAndFilter(writeConfig,
operations.stream().sorted(comparator).collect(Collectors.toList()));
}
}
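The comparator above sorts operations so the most recently created day partitions compact first; the partition path itself (formatted as yyyy/MM/dd) carries the ordering. A compact sketch of the same idea over bare partition-path strings, using java.time in place of SimpleDateFormat:

import java.time.LocalDate;
import java.time.format.DateTimeFormatter;
import java.util.Arrays;
import java.util.Comparator;
import java.util.List;
import java.util.stream.Collectors;

public class DayBasedOrderingSketch {

  private static final DateTimeFormatter FORMAT = DateTimeFormatter.ofPattern("yyyy/MM/dd");

  public static void main(String[] args) {
    List<String> partitionPaths = Arrays.asList("2018/03/18", "2018/03/20", "2018/03/19");

    // Latest partition first ("last in, first compacted"), mirroring the strategy's comparator.
    List<String> ordered = partitionPaths.stream()
        .sorted(Comparator.comparing((String p) -> LocalDate.parse(p, FORMAT)).reversed())
        .collect(Collectors.toList());

    System.out.println(ordered); // [2018/03/20, 2018/03/19, 2018/03/18]
  }
}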

View File

@@ -44,9 +44,9 @@ public class LogFileSizeBasedCompactionStrategy extends BoundedIOCompactionStrat
Map<String, Object> metrics = super.captureMetrics(dataFile, partitionPath, logFiles);
// Total size of all the log files
Long totalLogFileSize = logFiles.stream().map(HoodieLogFile::getFileSize).filter(
Optional::isPresent).map(Optional::get).reduce(
(size1, size2) -> size1 + size2).orElse(0L);
Long totalLogFileSize = logFiles.stream().map(HoodieLogFile::getFileSize)
.filter(Optional::isPresent).map(Optional::get).reduce((size1, size2) -> size1 + size2)
.orElse(0L);
// save the metrics needed during the order
metrics.put(TOTAL_LOG_FILE_SIZE, totalLogFileSize);
return metrics;

View File

@@ -36,8 +36,8 @@ import org.apache.spark.TaskContext;
* HoodieParquetWriter extends the ParquetWriter to help limit the size of underlying file. Provides
* a way to check if the current file can take more records with the <code>canWrite()</code>
*/
public class HoodieParquetWriter<T extends HoodieRecordPayload, R extends IndexedRecord>
extends ParquetWriter<IndexedRecord> implements HoodieStorageWriter<R> {
public class HoodieParquetWriter<T extends HoodieRecordPayload, R extends IndexedRecord> extends
ParquetWriter<IndexedRecord> implements HoodieStorageWriter<R> {
private static AtomicLong recordIndex = new AtomicLong(1);
@@ -49,6 +49,29 @@ public class HoodieParquetWriter<T extends HoodieRecordPayload, R extends Indexe
private final Schema schema;
public HoodieParquetWriter(String commitTime, Path file, HoodieParquetConfig parquetConfig,
Schema schema) throws IOException {
super(HoodieWrapperFileSystem.convertToHoodiePath(file, parquetConfig.getHadoopConf()),
ParquetFileWriter.Mode.CREATE, parquetConfig.getWriteSupport(),
parquetConfig.getCompressionCodecName(), parquetConfig.getBlockSize(),
parquetConfig.getPageSize(), parquetConfig.getPageSize(),
ParquetWriter.DEFAULT_IS_DICTIONARY_ENABLED, ParquetWriter.DEFAULT_IS_VALIDATING_ENABLED,
ParquetWriter.DEFAULT_WRITER_VERSION,
registerFileSystem(file, parquetConfig.getHadoopConf()));
this.file = HoodieWrapperFileSystem.convertToHoodiePath(file, parquetConfig.getHadoopConf());
this.fs = (HoodieWrapperFileSystem) this.file
.getFileSystem(registerFileSystem(file, parquetConfig.getHadoopConf()));
// We cannot accurately measure the snappy compressed output file size. We are choosing a
// conservative 10%
// TODO - compute this compression ratio dynamically by looking at the bytes written to the
// stream and the actual file size reported by HDFS
this.maxFileSize = parquetConfig.getMaxFileSize() + Math
.round(parquetConfig.getMaxFileSize() * parquetConfig.getCompressionRatio());
this.writeSupport = parquetConfig.getWriteSupport();
this.commitTime = commitTime;
this.schema = schema;
}
private static Configuration registerFileSystem(Path file, Configuration conf) {
Configuration returnConf = new Configuration(conf);
String scheme = FSUtils.getFs(file.toString(), conf).getScheme();
@@ -57,37 +80,12 @@ public class HoodieParquetWriter<T extends HoodieRecordPayload, R extends Indexe
return returnConf;
}
public HoodieParquetWriter(String commitTime, Path file,
HoodieParquetConfig parquetConfig, Schema schema) throws IOException {
super(HoodieWrapperFileSystem.convertToHoodiePath(file, parquetConfig.getHadoopConf()),
ParquetFileWriter.Mode.CREATE, parquetConfig.getWriteSupport(),
parquetConfig.getCompressionCodecName(), parquetConfig.getBlockSize(),
parquetConfig.getPageSize(), parquetConfig.getPageSize(),
ParquetWriter.DEFAULT_IS_DICTIONARY_ENABLED,
ParquetWriter.DEFAULT_IS_VALIDATING_ENABLED, ParquetWriter.DEFAULT_WRITER_VERSION,
registerFileSystem(file, parquetConfig.getHadoopConf()));
this.file =
HoodieWrapperFileSystem.convertToHoodiePath(file, parquetConfig.getHadoopConf());
this.fs = (HoodieWrapperFileSystem) this.file
.getFileSystem(registerFileSystem(file, parquetConfig.getHadoopConf()));
// We cannot accurately measure the snappy compressed output file size. We are choosing a conservative 10%
// TODO - compute this compression ratio dynamically by looking at the bytes written to the stream and the actual file size reported by HDFS
this.maxFileSize = parquetConfig.getMaxFileSize() + Math
.round(parquetConfig.getMaxFileSize() * parquetConfig.getCompressionRatio());
this.writeSupport = parquetConfig.getWriteSupport();
this.commitTime = commitTime;
this.schema = schema;
}
@Override
public void writeAvroWithMetadata(R avroRecord, HoodieRecord record) throws IOException {
String seqId = HoodieRecord.generateSequenceId(commitTime, TaskContext.getPartitionId(),
recordIndex.getAndIncrement());
HoodieAvroUtils.addHoodieKeyToRecord((GenericRecord) avroRecord,
record.getRecordKey(),
record.getPartitionPath(),
file.getName());
HoodieAvroUtils.addHoodieKeyToRecord((GenericRecord) avroRecord, record.getRecordKey(),
record.getPartitionPath(), file.getName());
HoodieAvroUtils.addCommitMetadataToRecord((GenericRecord) avroRecord, commitTime, seqId);
super.write(avroRecord);
writeSupport.add(record.getRecordKey());
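Because the bytes observed during the write are pre-compression, the writer pads its file-size limit by the configured compression ratio and then lets canWrite() compare the bytes written so far against that padded budget. A tiny sketch of just that arithmetic, with made-up numbers (a 120 MB limit and the 10% ratio mentioned above):

public class ParquetSizeBudgetSketch {

  public static void main(String[] args) {
    long maxFileSizeBytes = 120L * 1024 * 1024; // configured target file size
    double compressionRatio = 0.1;              // conservative 10% padding for compressed output

    // Same padding as HoodieParquetWriter: allow up to maxFileSize * (1 + ratio) raw bytes.
    long paddedBudget = maxFileSizeBytes + Math.round(maxFileSizeBytes * compressionRatio);
    System.out.println("padded budget (bytes): " + paddedBudget); // 138412032 (= 132 MB)

    // canWrite()-style check against bytes written so far.
    long bytesWrittenSoFar = 130L * 1024 * 1024;
    boolean canWrite = bytesWrittenSoFar < paddedBudget;
    System.out.println("canWrite with 130 MB written: " + canWrite); // true, still under 132 MB
  }
}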

View File

@@ -30,22 +30,22 @@ import org.apache.parquet.hadoop.metadata.CompressionCodecName;
public class HoodieStorageWriterFactory {
public static <T extends HoodieRecordPayload, R extends IndexedRecord> HoodieStorageWriter<R> getStorageWriter(
String commitTime, Path path, HoodieTable<T> hoodieTable, HoodieWriteConfig config,
Schema schema)
throws IOException {
public static <T extends HoodieRecordPayload, R extends IndexedRecord> HoodieStorageWriter<R>
getStorageWriter(String commitTime, Path path, HoodieTable<T> hoodieTable,
HoodieWriteConfig config, Schema schema) throws IOException {
//TODO - based on the metadata choose the implementation of HoodieStorageWriter
// Currently only parquet is supported
return newParquetStorageWriter(commitTime, path, config, schema, hoodieTable);
}
private static <T extends HoodieRecordPayload, R extends IndexedRecord> HoodieStorageWriter<R> newParquetStorageWriter(
private static <T extends HoodieRecordPayload, R extends IndexedRecord> HoodieStorageWriter<R>
newParquetStorageWriter(
String commitTime, Path path, HoodieWriteConfig config, Schema schema,
HoodieTable hoodieTable) throws IOException {
BloomFilter filter =
new BloomFilter(config.getBloomFilterNumEntries(), config.getBloomFilterFPP());
HoodieAvroWriteSupport writeSupport =
new HoodieAvroWriteSupport(new AvroSchemaConverter().convert(schema), schema, filter);
BloomFilter filter = new BloomFilter(config.getBloomFilterNumEntries(),
config.getBloomFilterFPP());
HoodieAvroWriteSupport writeSupport = new HoodieAvroWriteSupport(
new AvroSchemaConverter().convert(schema), schema, filter);
HoodieParquetConfig parquetConfig =
new HoodieParquetConfig(writeSupport, CompressionCodecName.GZIP,

View File

@@ -59,8 +59,8 @@ import org.apache.hadoop.util.Progressable;
*/
public class HoodieWrapperFileSystem extends FileSystem {
private static final Set<String> SUPPORT_SCHEMES;
public static final String HOODIE_SCHEME_PREFIX = "hoodie-";
private static final Set<String> SUPPORT_SCHEMES;
static {
SUPPORT_SCHEMES = new HashSet<>();
@@ -69,18 +69,50 @@ public class HoodieWrapperFileSystem extends FileSystem {
SUPPORT_SCHEMES.add("s3");
SUPPORT_SCHEMES.add("s3a");
// Hoodie currently relies on underlying object store being fully
// consistent so only regional buckets should be used.
SUPPORT_SCHEMES.add("gs");
SUPPORT_SCHEMES.add("viewfs");
}
private ConcurrentMap<String, SizeAwareFSDataOutputStream> openStreams =
new ConcurrentHashMap<>();
private ConcurrentMap<String, SizeAwareFSDataOutputStream> openStreams = new
ConcurrentHashMap<>();
private FileSystem fileSystem;
private URI uri;
public static Path convertToHoodiePath(Path file, Configuration conf) {
try {
String scheme = FSUtils.getFs(file.toString(), conf).getScheme();
return convertPathWithScheme(file, getHoodieScheme(scheme));
} catch (HoodieIOException e) {
throw e;
}
}
private static Path convertPathWithScheme(Path oldPath, String newScheme) {
URI oldURI = oldPath.toUri();
URI newURI;
try {
newURI = new URI(newScheme, oldURI.getUserInfo(), oldURI.getHost(), oldURI.getPort(),
oldURI.getPath(), oldURI.getQuery(), oldURI.getFragment());
return new Path(newURI);
} catch (URISyntaxException e) {
// TODO - Better Exception handling
throw new RuntimeException(e);
}
}
public static String getHoodieScheme(String scheme) {
String newScheme;
if (SUPPORT_SCHEMES.contains(scheme)) {
newScheme = HOODIE_SCHEME_PREFIX + scheme;
} else {
throw new IllegalArgumentException(
"BlockAlignedAvroParquetWriter does not support scheme " + scheme);
}
return newScheme;
}
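
The relocated helpers above amount to a URI scheme swap: a supported scheme such as hdfs or s3 gets the hoodie- prefix on the way in, and the prefix is stripped again before delegating to the wrapped FileSystem. A standalone sketch of that round trip (not the Hoodie code itself):

import java.net.URI;
import java.net.URISyntaxException;

/** Illustrative scheme round trip; mirrors the idea of convertPathWithScheme, not its exact code. */
public class SchemeWrappingSketch {
  static URI withScheme(URI uri, String scheme) throws URISyntaxException {
    return new URI(scheme, uri.getUserInfo(), uri.getHost(), uri.getPort(),
        uri.getPath(), uri.getQuery(), uri.getFragment());
  }

  public static void main(String[] args) throws URISyntaxException {
    URI original = new URI("hdfs://namenode:8020/tmp/hoodie/table");
    URI wrapped = withScheme(original, "hoodie-" + original.getScheme());
    URI unwrapped = withScheme(wrapped, wrapped.getScheme().replace("hoodie-", ""));
    System.out.println(wrapped);    // hoodie-hdfs://namenode:8020/tmp/hoodie/table
    System.out.println(unwrapped);  // hdfs://namenode:8020/tmp/hoodie/table
  }
}
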
@Override
public void initialize(URI uri, Configuration conf) throws IOException {
// Get the default filesystem to decorate
@@ -90,7 +122,8 @@ public class HoodieWrapperFileSystem extends FileSystem {
path = new Path(path.toString().replace(HOODIE_SCHEME_PREFIX, ""));
}
this.fileSystem = FSUtils.getFs(path.toString(), conf);
// Do not need to explicitly initialize the default filesystem, it's done already in the above FileSystem.get
// Do not need to explicitly initialize the default filesystem, it's done already in the above
// FileSystem.get
// fileSystem.initialize(FileSystem.getDefaultUri(conf), conf);
// fileSystem.setConf(conf);
this.uri = uri;
@@ -108,8 +141,7 @@ public class HoodieWrapperFileSystem extends FileSystem {
@Override
public FSDataOutputStream create(Path f, FsPermission permission, boolean overwrite,
int bufferSize, short replication, long blockSize, Progressable progress)
throws IOException {
int bufferSize, short replication, long blockSize, Progressable progress) throws IOException {
final Path translatedPath = convertToDefaultPath(f);
return wrapOutputStream(f, fileSystem
.create(translatedPath, permission, overwrite, bufferSize, replication, blockSize,
@@ -122,8 +154,8 @@ public class HoodieWrapperFileSystem extends FileSystem {
return fsDataOutputStream;
}
SizeAwareFSDataOutputStream os =
new SizeAwareFSDataOutputStream(fsDataOutputStream, new Runnable() {
SizeAwareFSDataOutputStream os = new SizeAwareFSDataOutputStream(fsDataOutputStream,
new Runnable() {
@Override
public void run() {
openStreams.remove(path.getName());
@@ -160,14 +192,13 @@ public class HoodieWrapperFileSystem extends FileSystem {
}
@Override
public FSDataOutputStream create(Path f, boolean overwrite, int bufferSize)
throws IOException {
public FSDataOutputStream create(Path f, boolean overwrite, int bufferSize) throws IOException {
return fileSystem.create(convertToDefaultPath(f), overwrite, bufferSize);
}
@Override
public FSDataOutputStream create(Path f, boolean overwrite, int bufferSize,
Progressable progress) throws IOException {
public FSDataOutputStream create(Path f, boolean overwrite, int bufferSize, Progressable progress)
throws IOException {
return fileSystem.create(convertToDefaultPath(f), overwrite, bufferSize, progress);
}
@@ -175,14 +206,12 @@ public class HoodieWrapperFileSystem extends FileSystem {
public FSDataOutputStream create(Path f, boolean overwrite, int bufferSize, short replication,
long blockSize, Progressable progress) throws IOException {
return fileSystem
.create(convertToDefaultPath(f), overwrite, bufferSize, replication, blockSize,
progress);
.create(convertToDefaultPath(f), overwrite, bufferSize, replication, blockSize, progress);
}
@Override
public FSDataOutputStream create(Path f, FsPermission permission, EnumSet<CreateFlag> flags,
int bufferSize, short replication, long blockSize, Progressable progress)
throws IOException {
int bufferSize, short replication, long blockSize, Progressable progress) throws IOException {
return fileSystem
.create(convertToDefaultPath(f), permission, flags, bufferSize, replication, blockSize,
progress);
@@ -197,7 +226,6 @@ public class HoodieWrapperFileSystem extends FileSystem {
progress, checksumOpt);
}
@Override
public FSDataOutputStream create(Path f, boolean overwrite, int bufferSize, short replication,
long blockSize) throws IOException {
@@ -205,7 +233,6 @@ public class HoodieWrapperFileSystem extends FileSystem {
.create(convertToDefaultPath(f), overwrite, bufferSize, replication, blockSize);
}
@Override
public FSDataOutputStream append(Path f, int bufferSize, Progressable progress)
throws IOException {
@@ -228,13 +255,13 @@ public class HoodieWrapperFileSystem extends FileSystem {
}
@Override
public void setWorkingDirectory(Path new_dir) {
fileSystem.setWorkingDirectory(convertToDefaultPath(new_dir));
public Path getWorkingDirectory() {
return convertToHoodiePath(fileSystem.getWorkingDirectory());
}
@Override
public Path getWorkingDirectory() {
return convertToHoodiePath(fileSystem.getWorkingDirectory());
public void setWorkingDirectory(Path newDir) {
fileSystem.setWorkingDirectory(convertToDefaultPath(newDir));
}
@Override
@@ -290,8 +317,7 @@ public class HoodieWrapperFileSystem extends FileSystem {
}
@Override
public BlockLocation[] getFileBlockLocations(Path p, long start, long len)
throws IOException {
public BlockLocation[] getFileBlockLocations(Path p, long start, long len) throws IOException {
return fileSystem.getFileBlockLocations(convertToDefaultPath(p), start, len);
}
@@ -319,17 +345,16 @@ public class HoodieWrapperFileSystem extends FileSystem {
public FSDataOutputStream createNonRecursive(Path f, boolean overwrite, int bufferSize,
short replication, long blockSize, Progressable progress) throws IOException {
return fileSystem
.createNonRecursive(convertToDefaultPath(f), overwrite, bufferSize, replication,
blockSize, progress);
.createNonRecursive(convertToDefaultPath(f), overwrite, bufferSize, replication, blockSize,
progress);
}
@Override
public FSDataOutputStream createNonRecursive(Path f, FsPermission permission, boolean overwrite,
int bufferSize, short replication, long blockSize, Progressable progress)
throws IOException {
int bufferSize, short replication, long blockSize, Progressable progress) throws IOException {
return fileSystem
.createNonRecursive(convertToDefaultPath(f), permission, overwrite, bufferSize,
replication, blockSize, progress);
.createNonRecursive(convertToDefaultPath(f), permission, overwrite, bufferSize, replication,
blockSize, progress);
}
@Override
@@ -418,20 +443,17 @@ public class HoodieWrapperFileSystem extends FileSystem {
}
@Override
public FileStatus[] listStatus(Path f, PathFilter filter)
throws IOException {
public FileStatus[] listStatus(Path f, PathFilter filter) throws IOException {
return fileSystem.listStatus(convertToDefaultPath(f), filter);
}
@Override
public FileStatus[] listStatus(Path[] files)
throws IOException {
public FileStatus[] listStatus(Path[] files) throws IOException {
return fileSystem.listStatus(convertDefaults(files));
}
@Override
public FileStatus[] listStatus(Path[] files, PathFilter filter)
throws IOException {
public FileStatus[] listStatus(Path[] files, PathFilter filter) throws IOException {
return fileSystem.listStatus(convertDefaults(files), filter);
}
@@ -441,20 +463,17 @@ public class HoodieWrapperFileSystem extends FileSystem {
}
@Override
public FileStatus[] globStatus(Path pathPattern, PathFilter filter)
throws IOException {
public FileStatus[] globStatus(Path pathPattern, PathFilter filter) throws IOException {
return fileSystem.globStatus(convertToDefaultPath(pathPattern), filter);
}
@Override
public RemoteIterator<LocatedFileStatus> listLocatedStatus(Path f)
throws IOException {
public RemoteIterator<LocatedFileStatus> listLocatedStatus(Path f) throws IOException {
return fileSystem.listLocatedStatus(convertToDefaultPath(f));
}
@Override
public RemoteIterator<LocatedFileStatus> listFiles(Path f, boolean recursive)
throws IOException {
public RemoteIterator<LocatedFileStatus> listFiles(Path f, boolean recursive) throws IOException {
return fileSystem.listFiles(convertToDefaultPath(f), recursive);
}
@@ -498,8 +517,8 @@ public class HoodieWrapperFileSystem extends FileSystem {
@Override
public void copyFromLocalFile(boolean delSrc, boolean overwrite, Path src, Path dst)
throws IOException {
fileSystem.copyFromLocalFile(delSrc, overwrite, convertToDefaultPath(src),
convertToDefaultPath(dst));
fileSystem
.copyFromLocalFile(delSrc, overwrite, convertToDefaultPath(src), convertToDefaultPath(dst));
}
@Override
@@ -525,15 +544,13 @@ public class HoodieWrapperFileSystem extends FileSystem {
}
@Override
public Path startLocalOutput(Path fsOutputFile, Path tmpLocalFile)
throws IOException {
return convertToHoodiePath(fileSystem.startLocalOutput(convertToDefaultPath(fsOutputFile),
convertToDefaultPath(tmpLocalFile)));
public Path startLocalOutput(Path fsOutputFile, Path tmpLocalFile) throws IOException {
return convertToHoodiePath(fileSystem
.startLocalOutput(convertToDefaultPath(fsOutputFile), convertToDefaultPath(tmpLocalFile)));
}
@Override
public void completeLocalOutput(Path fsOutputFile, Path tmpLocalFile)
throws IOException {
public void completeLocalOutput(Path fsOutputFile, Path tmpLocalFile) throws IOException {
fileSystem.completeLocalOutput(convertToDefaultPath(fsOutputFile),
convertToDefaultPath(tmpLocalFile));
}
@@ -574,23 +591,18 @@ public class HoodieWrapperFileSystem extends FileSystem {
}
@Override
public void access(Path path, FsAction mode)
throws IOException {
public void access(Path path, FsAction mode) throws IOException {
fileSystem.access(convertToDefaultPath(path), mode);
}
@Override
public void createSymlink(Path target, Path link, boolean createParent)
throws
IOException {
public void createSymlink(Path target, Path link, boolean createParent) throws IOException {
fileSystem
.createSymlink(convertToDefaultPath(target), convertToDefaultPath(link), createParent);
}
@Override
public FileStatus getFileLinkStatus(Path f)
throws
IOException {
public FileStatus getFileLinkStatus(Path f) throws IOException {
return fileSystem.getFileLinkStatus(convertToDefaultPath(f));
}
@@ -651,8 +663,7 @@ public class HoodieWrapperFileSystem extends FileSystem {
@Override
public Path createSnapshot(Path path, String snapshotName) throws IOException {
return convertToHoodiePath(
fileSystem.createSnapshot(convertToDefaultPath(path), snapshotName));
return convertToHoodiePath(fileSystem.createSnapshot(convertToDefaultPath(path), snapshotName));
}
@Override
@@ -718,8 +729,7 @@ public class HoodieWrapperFileSystem extends FileSystem {
}
@Override
public Map<String, byte[]> getXAttrs(Path path, List<String> names)
throws IOException {
public Map<String, byte[]> getXAttrs(Path path, List<String> names) throws IOException {
return fileSystem.getXAttrs(convertToDefaultPath(path), names);
}
@@ -734,13 +744,13 @@ public class HoodieWrapperFileSystem extends FileSystem {
}
@Override
public void setConf(Configuration conf) {
// ignore this. we will set conf on init
public Configuration getConf() {
return fileSystem.getConf();
}
@Override
public Configuration getConf() {
return fileSystem.getConf();
public void setConf(Configuration conf) {
// ignore this. we will set conf on init
}
@Override
@@ -762,15 +772,6 @@ public class HoodieWrapperFileSystem extends FileSystem {
return convertPathWithScheme(oldPath, getHoodieScheme(fileSystem.getScheme()));
}
public static Path convertToHoodiePath(Path file, Configuration conf) {
try {
String scheme = FSUtils.getFs(file.toString(), conf).getScheme();
return convertPathWithScheme(file, getHoodieScheme(scheme));
} catch (HoodieIOException e) {
throw e;
}
}
private Path convertToDefaultPath(Path oldPath) {
return convertPathWithScheme(oldPath, fileSystem.getScheme());
}
@@ -783,30 +784,6 @@ public class HoodieWrapperFileSystem extends FileSystem {
return psrcsNew;
}
private static Path convertPathWithScheme(Path oldPath, String newScheme) {
URI oldURI = oldPath.toUri();
URI newURI;
try {
newURI = new URI(newScheme, oldURI.getUserInfo(), oldURI.getHost(), oldURI.getPort(),
oldURI.getPath(), oldURI.getQuery(), oldURI.getFragment());
return new Path(newURI);
} catch (URISyntaxException e) {
// TODO - Better Exception handling
throw new RuntimeException(e);
}
}
public static String getHoodieScheme(String scheme) {
String newScheme;
if (SUPPORT_SCHEMES.contains(scheme)) {
newScheme = HOODIE_SCHEME_PREFIX + scheme;
} else {
throw new IllegalArgumentException(
"BlockAlignedAvroParquetWriter does not support scheme " + scheme);
}
return newScheme;
}
public long getBytesWritten(Path file) {
if (openStreams.containsKey(file.getName())) {
return openStreams.get(file.getName()).getBytesWritten();
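
getBytesWritten only works because every stream handed out by create() is wrapped in a SizeAwareFSDataOutputStream and remembered in the openStreams map. A rough sketch of that decorator idea using plain java.io types instead of FSDataOutputStream:

import java.io.FilterOutputStream;
import java.io.IOException;
import java.io.OutputStream;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentMap;
import java.util.concurrent.atomic.AtomicLong;

/** Illustrative only: counts bytes as they pass through, so the caller can ask for file sizes later. */
public class SizeTrackingSketch {
  static final ConcurrentMap<String, AtomicLong> BYTES_WRITTEN = new ConcurrentHashMap<>();

  static OutputStream track(String fileName, OutputStream delegate) {
    AtomicLong counter = BYTES_WRITTEN.computeIfAbsent(fileName, k -> new AtomicLong());
    return new FilterOutputStream(delegate) {
      @Override
      public void write(int b) throws IOException {
        out.write(b);
        counter.incrementAndGet();
      }

      @Override
      public void write(byte[] b, int off, int len) throws IOException {
        out.write(b, off, len);
        counter.addAndGet(len);
      }
    };
  }

  static long getBytesWritten(String fileName) {
    AtomicLong counter = BYTES_WRITTEN.get(fileName);
    return counter == null ? 0L : counter.get();
  }
}
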

View File

@@ -30,14 +30,14 @@ import org.apache.log4j.Logger;
*/
public class HoodieMetrics {
private HoodieWriteConfig config = null;
private String tableName = null;
private static Logger logger = LogManager.getLogger(HoodieMetrics.class);
// Some timers
public String rollbackTimerName = null;
public String cleanTimerName = null;
public String commitTimerName = null;
public String finalizeTimerName = null;
private HoodieWriteConfig config = null;
private String tableName = null;
private Timer rollbackTimer = null;
private Timer cleanTimer = null;
private Timer commitTimer = null;
@@ -113,8 +113,9 @@ public class HoodieMetrics {
public void updateRollbackMetrics(long durationInMs, long numFilesDeleted) {
if (config.isMetricsOn()) {
logger.info(String.format("Sending rollback metrics (duration=%d, numFilesDeleted=%d)",
durationInMs, numFilesDeleted));
logger.info(String
.format("Sending rollback metrics (duration=%d, numFilesDeleted=%d)", durationInMs,
numFilesDeleted));
registerGauge(getMetricsName("rollback", "duration"), durationInMs);
registerGauge(getMetricsName("rollback", "numFilesDeleted"), numFilesDeleted);
}
@@ -122,8 +123,9 @@ public class HoodieMetrics {
public void updateCleanMetrics(long durationInMs, int numFilesDeleted) {
if (config.isMetricsOn()) {
logger.info(String.format("Sending clean metrics (duration=%d, numFilesDeleted=%d)",
durationInMs, numFilesDeleted));
logger.info(String
.format("Sending clean metrics (duration=%d, numFilesDeleted=%d)", durationInMs,
numFilesDeleted));
registerGauge(getMetricsName("clean", "duration"), durationInMs);
registerGauge(getMetricsName("clean", "numFilesDeleted"), numFilesDeleted);
}
@@ -131,7 +133,8 @@ public class HoodieMetrics {
public void updateFinalizeWriteMetrics(long durationInMs, int numFilesFinalized) {
if (config.isMetricsOn()) {
logger.info(String.format("Sending finalize write metrics (duration=%d, numFilesFinalized=%d)",
logger.info(String
.format("Sending finalize write metrics (duration=%d, numFilesFinalized=%d)",
durationInMs, numFilesFinalized));
registerGauge(getMetricsName("finalize", "duration"), durationInMs);
registerGauge(getMetricsName("finalize", "numFilesFinalized"), numFilesFinalized);
@@ -140,8 +143,7 @@ public class HoodieMetrics {
@VisibleForTesting
String getMetricsName(String action, String metric) {
return config == null ? null :
String.format("%s.%s.%s", tableName, action, metric);
return config == null ? null : String.format("%s.%s.%s", tableName, action, metric);
}
void registerGauge(String metricName, final long value) {
@@ -154,7 +156,8 @@ public class HoodieMetrics {
}
});
} catch (Exception e) {
// Here we catch all exceptions, so the major upsert pipeline will not be affected if the metrics system
// Here we catch all exceptions, so the major upsert pipeline will not be affected if the
// metrics system
// has some issues.
logger.error("Failed to send metrics: ", e);
}
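
The naming convention and the deliberately swallowed exception above condense into a few lines against Dropwizard Metrics (which is where the MetricRegistry and GraphiteReporter used here come from). This is a sketch, not the HoodieMetrics class:

import com.codahale.metrics.Gauge;
import com.codahale.metrics.MetricRegistry;

/** Illustrative only: <table>.<action>.<metric> naming plus a gauge registration that never fails the writer. */
public class GaugeSketch {
  private final MetricRegistry registry = new MetricRegistry();

  void registerGauge(String tableName, String action, String metric, final long value) {
    String name = String.format("%s.%s.%s", tableName, action, metric);
    try {
      registry.register(name, (Gauge<Long>) () -> value);
    } catch (Exception e) {
      // A broken metrics backend should never fail the ingestion job itself.
      System.err.println("Failed to register metric " + name + ": " + e.getMessage());
    }
  }
}
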

View File

@@ -33,14 +33,13 @@ import org.apache.log4j.Logger;
*/
public class MetricsGraphiteReporter extends MetricsReporter {
private static Logger logger = LogManager.getLogger(MetricsGraphiteReporter.class);
private final MetricRegistry registry;
private final GraphiteReporter graphiteReporter;
private final HoodieWriteConfig config;
private String serverHost;
private int serverPort;
private static Logger logger = LogManager.getLogger(MetricsGraphiteReporter.class);
public MetricsGraphiteReporter(HoodieWriteConfig config, MetricRegistry registry) {
this.registry = registry;
this.config = config;
@@ -49,8 +48,8 @@ public class MetricsGraphiteReporter extends MetricsReporter {
this.serverHost = config.getGraphiteServerHost();
this.serverPort = config.getGraphiteServerPort();
if (serverHost == null || serverPort == 0) {
throw new RuntimeException(
String.format("Graphite cannot be initialized with serverHost[%s] and serverPort[%s].",
throw new RuntimeException(String
.format("Graphite cannot be initialized with serverHost[%s] and serverPort[%s].",
serverHost, serverPort));
}
@@ -81,14 +80,10 @@ public class MetricsGraphiteReporter extends MetricsReporter {
}
private GraphiteReporter createGraphiteReport() {
Graphite graphite = new Graphite(
new InetSocketAddress(serverHost, serverPort));
Graphite graphite = new Graphite(new InetSocketAddress(serverHost, serverPort));
String reporterPrefix = config.getGraphiteMetricPrefix();
return GraphiteReporter.forRegistry(registry)
.prefixedWith(reporterPrefix)
.convertRatesTo(TimeUnit.SECONDS)
.convertDurationsTo(TimeUnit.MILLISECONDS)
.filter(MetricFilter.ALL)
.build(graphite);
return GraphiteReporter.forRegistry(registry).prefixedWith(reporterPrefix)
.convertRatesTo(TimeUnit.SECONDS).convertDurationsTo(TimeUnit.MILLISECONDS)
.filter(MetricFilter.ALL).build(graphite);
}
}

View File

@@ -28,8 +28,7 @@ public class MetricsReporterFactory {
private static Logger logger = LogManager.getLogger(MetricsReporterFactory.class);
public static MetricsReporter createReporter(HoodieWriteConfig config,
MetricRegistry registry) {
public static MetricsReporter createReporter(HoodieWriteConfig config, MetricRegistry registry) {
MetricsReporterType type = config.getMetricsReporterType();
MetricsReporter reporter = null;
switch (type) {

View File

@@ -21,6 +21,5 @@ package com.uber.hoodie.metrics;
* future.
*/
public enum MetricsReporterType {
GRAPHITE,
INMEMORY
GRAPHITE, INMEMORY
}

View File

@@ -75,23 +75,425 @@ import scala.Tuple2;
/**
* Implementation of a very heavily read-optimized Hoodie Table where
*
* <p>
* INSERTS - Produce new files, block aligned to desired size (or) Merge with the smallest existing
* file, to expand it
*
* <p>
* UPDATES - Produce a new version of the file, just replacing the updated records with new values
*/
public class HoodieCopyOnWriteTable<T extends HoodieRecordPayload> extends HoodieTable<T> {
private static Logger logger = LogManager.getLogger(HoodieCopyOnWriteTable.class);
public HoodieCopyOnWriteTable(HoodieWriteConfig config, HoodieTableMetaClient metaClient) {
super(config, metaClient);
}
private static Logger logger = LogManager.getLogger(HoodieCopyOnWriteTable.class);
private static PairFlatMapFunction<Iterator<Tuple2<String, String>>, String,
PartitionCleanStat> deleteFilesFunc(
HoodieTable table) {
return (PairFlatMapFunction<Iterator<Tuple2<String, String>>, String, PartitionCleanStat>)
iter -> {
Map<String, PartitionCleanStat> partitionCleanStatMap = new HashMap<>();
FileSystem fs = table.getMetaClient().getFs();
while (iter.hasNext()) {
Tuple2<String, String> partitionDelFileTuple = iter.next();
String partitionPath = partitionDelFileTuple._1();
String deletePathStr = partitionDelFileTuple._2();
Boolean deletedFileResult = deleteFileAndGetResult(fs, deletePathStr);
if (!partitionCleanStatMap.containsKey(partitionPath)) {
partitionCleanStatMap.put(partitionPath, new PartitionCleanStat(partitionPath));
}
PartitionCleanStat partitionCleanStat = partitionCleanStatMap.get(partitionPath);
partitionCleanStat.addDeleteFilePatterns(deletePathStr);
partitionCleanStat.addDeletedFileResult(deletePathStr, deletedFileResult);
}
return partitionCleanStatMap.entrySet().stream()
.map(e -> new Tuple2<>(e.getKey(), e.getValue()))
.collect(Collectors.toList()).iterator();
};
}
private static PairFlatMapFunction<String, String, String> getFilesToDeleteFunc(HoodieTable table,
HoodieWriteConfig config) {
return (PairFlatMapFunction<String, String, String>) partitionPathToClean -> {
HoodieCleanHelper cleaner = new HoodieCleanHelper(table, config);
return cleaner.getDeletePaths(partitionPathToClean).stream()
.map(deleteFile -> new Tuple2<>(partitionPathToClean, deleteFile.toString())).iterator();
};
}
private static Boolean deleteFileAndGetResult(FileSystem fs, String deletePathStr)
throws IOException {
Path deletePath = new Path(deletePathStr);
logger.debug("Working on delete path :" + deletePath);
boolean deleteResult = fs.delete(deletePath, false);
if (deleteResult) {
logger.debug("Cleaned file at path :" + deletePath);
}
return deleteResult;
}
@Override
public Partitioner getUpsertPartitioner(WorkloadProfile profile) {
if (profile == null) {
throw new HoodieUpsertException("Need workload profile to construct the upsert partitioner.");
}
return new UpsertPartitioner(profile);
}
@Override
public Partitioner getInsertPartitioner(WorkloadProfile profile) {
return getUpsertPartitioner(profile);
}
@Override
public boolean isWorkloadProfileNeeded() {
return true;
}
@Override
public JavaRDD<WriteStatus> compact(JavaSparkContext jsc, String commitTime) {
throw new HoodieNotSupportedException("Compaction is not supported from a CopyOnWrite table");
}
public Iterator<List<WriteStatus>> handleUpdate(String commitTime, String fileLoc,
Iterator<HoodieRecord<T>> recordItr) throws IOException {
// these are updates
HoodieMergeHandle upsertHandle = getUpdateHandle(commitTime, fileLoc, recordItr);
return handleUpdateInternal(upsertHandle, commitTime, fileLoc);
}
public Iterator<List<WriteStatus>> handleUpdate(String commitTime, String fileLoc,
Map<String, HoodieRecord<T>> keyToNewRecords) throws IOException {
// these are updates
HoodieMergeHandle upsertHandle = getUpdateHandle(commitTime, fileLoc, keyToNewRecords);
return handleUpdateInternal(upsertHandle, commitTime, fileLoc);
}
protected Iterator<List<WriteStatus>> handleUpdateInternal(HoodieMergeHandle upsertHandle,
String commitTime, String fileLoc) throws IOException {
if (upsertHandle.getOldFilePath() == null) {
throw new HoodieUpsertException(
"Error in finding the old file path at commit " + commitTime + " at fileLoc: " + fileLoc);
} else {
AvroReadSupport.setAvroReadSchema(getHadoopConf(), upsertHandle.getSchema());
ParquetReader<IndexedRecord> reader = AvroParquetReader.builder(upsertHandle.getOldFilePath())
.withConf(getHadoopConf()).build();
try {
IndexedRecord record;
while ((record = reader.read()) != null) {
// Two types of writes here (new record, and old record).
// We have already caught the exception during writing new records.
// But for old records, we should fail if any exception happens.
upsertHandle.write((GenericRecord) record);
}
} catch (IOException e) {
throw new HoodieUpsertException(
"Failed to read record from " + upsertHandle.getOldFilePath() + " with new Schema "
+ upsertHandle.getSchema(), e);
} finally {
reader.close();
upsertHandle.close();
}
}
//TODO(vc): This needs to be revisited
if (upsertHandle.getWriteStatus().getPartitionPath() == null) {
logger.info("Upsert Handle has partition path as null " + upsertHandle.getOldFilePath() + ", "
+ upsertHandle.getWriteStatus());
}
return Collections.singletonList(Collections.singletonList(upsertHandle.getWriteStatus()))
.iterator();
}
protected HoodieMergeHandle getUpdateHandle(String commitTime, String fileLoc,
Iterator<HoodieRecord<T>> recordItr) {
return new HoodieMergeHandle<>(config, commitTime, this, recordItr, fileLoc);
}
protected HoodieMergeHandle getUpdateHandle(String commitTime, String fileLoc,
Map<String, HoodieRecord<T>> keyToNewRecords) {
return new HoodieMergeHandle<>(config, commitTime, this, keyToNewRecords, fileLoc);
}
public Iterator<List<WriteStatus>> handleInsert(String commitTime,
Iterator<HoodieRecord<T>> recordItr) throws Exception {
return new LazyInsertIterable<>(recordItr, config, commitTime, this);
}
@SuppressWarnings("unchecked")
@Override
public Iterator<List<WriteStatus>> handleUpsertPartition(String commitTime, Integer partition,
Iterator recordItr, Partitioner partitioner) {
UpsertPartitioner upsertPartitioner = (UpsertPartitioner) partitioner;
BucketInfo binfo = upsertPartitioner.getBucketInfo(partition);
BucketType btype = binfo.bucketType;
try {
if (btype.equals(BucketType.INSERT)) {
return handleInsert(commitTime, recordItr);
} else if (btype.equals(BucketType.UPDATE)) {
return handleUpdate(commitTime, binfo.fileLoc, recordItr);
} else {
throw new HoodieUpsertException(
"Unknown bucketType " + btype + " for partition :" + partition);
}
} catch (Throwable t) {
String msg = "Error upserting bucketType " + btype + " for partition :" + partition;
logger.error(msg, t);
throw new HoodieUpsertException(msg, t);
}
}
@Override
public Iterator<List<WriteStatus>> handleInsertPartition(String commitTime, Integer partition,
Iterator recordItr, Partitioner partitioner) {
return handleUpsertPartition(commitTime, partition, recordItr, partitioner);
}
/**
* Performs cleaning of partition paths according to cleaning policy and returns the number of
* files cleaned. Handles skews in partitions to clean by making files to clean as the unit of
* task distribution.
*
* @throws IllegalArgumentException if unknown cleaning policy is provided
*/
@Override
public List<HoodieCleanStat> clean(JavaSparkContext jsc) {
try {
FileSystem fs = getMetaClient().getFs();
List<String> partitionsToClean = FSUtils
.getAllPartitionPaths(fs, getMetaClient().getBasePath(),
config.shouldAssumeDatePartitioning());
logger.info("Partitions to clean up : " + partitionsToClean + ", with policy " + config
.getCleanerPolicy());
if (partitionsToClean.isEmpty()) {
logger.info("Nothing to clean here mom. It is already clean");
return Collections.emptyList();
}
return cleanPartitionPaths(partitionsToClean, jsc);
} catch (IOException e) {
throw new HoodieIOException("Failed to clean up after commit", e);
}
}
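
The Javadoc above calls out the key trick: the unit of parallelism for cleaning is the individual file, not the partition, so one huge partition cannot skew the job (cleanPartitionPaths further down does the flatMap/repartition dance). A stripped-down sketch of that flow with Spark's Java API, with stand-in delete logic instead of HoodieCleanHelper:

import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.api.java.function.PairFlatMapFunction;
import org.apache.spark.api.java.function.PairFunction;
import scala.Tuple2;

import java.util.Arrays;
import java.util.List;

/** Illustrative only: expand partitions into (partition, file) pairs, repartition, then delete per task. */
public class DistributedCleanSketch {
  static JavaPairRDD<String, Boolean> clean(JavaSparkContext jsc, List<String> partitions, int parallelism) {
    // One partition may hold many files to delete; emit one pair per file (stand-in file names).
    PairFlatMapFunction<String, String, String> expandFiles = partition -> Arrays.asList(
        new Tuple2<>(partition, partition + "/old_file_1.parquet"),
        new Tuple2<>(partition, partition + "/old_file_2.parquet")).iterator();
    // Pretend-delete each file and report success keyed by partition.
    PairFunction<Tuple2<String, String>, String, Boolean> deleteFile =
        pair -> new Tuple2<>(pair._1(), deleteQuietly(pair._2()));
    return jsc.parallelize(partitions, Math.max(1, Math.min(partitions.size(), parallelism)))
        .flatMapToPair(expandFiles)
        .repartition(parallelism) // spread files evenly so a skewed partition does not pin one task
        .mapToPair(deleteFile);
  }

  static boolean deleteQuietly(String path) {
    return true; // stand-in for fs.delete(new Path(path), false)
  }
}
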
/**
* Common method used for cleaning out parquet files under a partition path during rollback of a
* set of commits
*/
protected Map<FileStatus, Boolean> deleteCleanedFiles(String partitionPath, List<String> commits)
throws IOException {
logger.info("Cleaning path " + partitionPath);
FileSystem fs = getMetaClient().getFs();
FileStatus[] toBeDeleted = fs
.listStatus(new Path(config.getBasePath(), partitionPath), path -> {
if (!path.toString().contains(".parquet")) {
return false;
}
String fileCommitTime = FSUtils.getCommitTime(path.getName());
return commits.contains(fileCommitTime);
});
Map<FileStatus, Boolean> results = Maps.newHashMap();
for (FileStatus file : toBeDeleted) {
boolean success = fs.delete(file.getPath(), false);
results.put(file, success);
logger.info("Delete file " + file.getPath() + "\t" + success);
}
return results;
}
@Override
public List<HoodieRollbackStat> rollback(JavaSparkContext jsc, List<String> commits)
throws IOException {
String actionType = this.getCommitActionType();
HoodieActiveTimeline activeTimeline = this.getActiveTimeline();
List<String> inflights = this.getInflightCommitTimeline().getInstants()
.map(HoodieInstant::getTimestamp).collect(Collectors.toList());
// Atomically unpublish all the commits
commits.stream().filter(s -> !inflights.contains(s))
.map(s -> new HoodieInstant(false, actionType, s))
.forEach(activeTimeline::revertToInflight);
logger.info("Unpublished " + commits);
// delete all the data files for all these commits
logger.info("Clean out all parquet files generated for commits: " + commits);
List<HoodieRollbackStat> stats = jsc.parallelize(FSUtils
.getAllPartitionPaths(metaClient.getFs(), getMetaClient().getBasePath(),
config.shouldAssumeDatePartitioning()))
.map((Function<String, HoodieRollbackStat>) partitionPath -> {
// Scan all partitions files with this commit time
Map<FileStatus, Boolean> results = deleteCleanedFiles(partitionPath, commits);
return HoodieRollbackStat.newBuilder().withPartitionPath(partitionPath)
.withDeletedFileResults(results).build();
}).collect();
// clean temporary data files
cleanTemporaryDataFiles(jsc);
// Remove the rolled back inflight commits
commits.stream().map(s -> new HoodieInstant(true, actionType, s))
.forEach(activeTimeline::deleteInflight);
logger.info("Deleted inflight commits " + commits);
return stats;
}
/**
* Finalize the written data files
*
* @param writeStatuses List of WriteStatus
* @return number of files finalized
*/
@Override
@SuppressWarnings("unchecked")
public Optional<Integer> finalizeWrite(JavaSparkContext jsc, List writeStatuses) {
if (!config.shouldUseTempFolderForCopyOnWrite()) {
return Optional.empty();
}
// This is to rename each data file from temporary path to its final location
List<Tuple2<String, Boolean>> results = jsc
.parallelize(writeStatuses, config.getFinalizeWriteParallelism()).map(writeStatus -> {
Tuple2<String, HoodieWriteStat> writeStatTuple2 = (Tuple2<String, HoodieWriteStat>)
writeStatus;
HoodieWriteStat writeStat = writeStatTuple2._2();
final FileSystem fs = getMetaClient().getFs();
final Path finalPath = new Path(config.getBasePath(), writeStat.getPath());
if (writeStat.getTempPath() != null) {
final Path tempPath = new Path(config.getBasePath(), writeStat.getTempPath());
boolean success;
try {
logger.info("Renaming temporary file: " + tempPath + " to " + finalPath);
success = fs.rename(tempPath, finalPath);
} catch (IOException e) {
throw new HoodieIOException(
"Failed to rename file: " + tempPath + " to " + finalPath);
}
if (!success) {
throw new HoodieIOException(
"Failed to rename file: " + tempPath + " to " + finalPath);
}
}
return new Tuple2<>(writeStat.getPath(), true);
}).collect();
// clean temporary data files
cleanTemporaryDataFiles(jsc);
return Optional.of(results.size());
}
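
finalizeWrite is essentially a publish step: data files are first written under a temporary folder and only renamed into place once the write succeeds, so a failed or retried Spark stage never leaves partial files at their final path. A file-system level sketch of that promotion step (plain Hadoop FileSystem, not the table code):

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;

import java.io.IOException;

/** Illustrative only: move a data file from the temp folder to its final location, failing loudly if the rename does not stick. */
public class FinalizeRenameSketch {
  static void promote(Configuration conf, String basePath, String tempRelPath, String finalRelPath)
      throws IOException {
    FileSystem fs = FileSystem.get(conf);
    Path tempPath = new Path(basePath, tempRelPath);
    Path finalPath = new Path(basePath, finalRelPath);
    if (!fs.rename(tempPath, finalPath)) {
      throw new IOException("Failed to rename " + tempPath + " to " + finalPath);
    }
  }
}
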
/**
* Clean temporary data files that are produced from previous failed commit or retried spark
* stages.
*/
private void cleanTemporaryDataFiles(JavaSparkContext jsc) {
if (!config.shouldUseTempFolderForCopyOnWrite()) {
return;
}
final FileSystem fs = getMetaClient().getFs();
final Path temporaryFolder = new Path(config.getBasePath(),
HoodieTableMetaClient.TEMPFOLDER_NAME);
try {
if (!fs.exists(temporaryFolder)) {
logger.info("Temporary folder does not exist: " + temporaryFolder);
return;
}
List<FileStatus> fileStatusesList = Arrays.asList(fs.listStatus(temporaryFolder));
List<Tuple2<String, Boolean>> results = jsc
.parallelize(fileStatusesList, config.getFinalizeWriteParallelism()).map(fileStatus -> {
FileSystem fs1 = getMetaClient().getFs();
boolean success = fs1.delete(fileStatus.getPath(), false);
logger
.info("Deleting file in temporary folder" + fileStatus.getPath() + "\t" + success);
return new Tuple2<>(fileStatus.getPath().toString(), success);
}).collect();
for (Tuple2<String, Boolean> result : results) {
if (!result._2()) {
logger.info("Failed to delete file: " + result._1());
throw new HoodieIOException("Failed to delete file in temporary folder: " + result._1());
}
}
} catch (IOException e) {
throw new HoodieIOException(
"Failed to clean data files in temporary folder: " + temporaryFolder);
}
}
private List<HoodieCleanStat> cleanPartitionPaths(List<String> partitionsToClean,
JavaSparkContext jsc) {
int cleanerParallelism = Math.min(partitionsToClean.size(), config.getCleanerParallelism());
logger.info("Using cleanerParallelism: " + cleanerParallelism);
List<Tuple2<String, PartitionCleanStat>> partitionCleanStats = jsc
.parallelize(partitionsToClean, cleanerParallelism)
.flatMapToPair(getFilesToDeleteFunc(this, config))
.repartition(cleanerParallelism) // repartition to remove skews
.mapPartitionsToPair(deleteFilesFunc(this)).reduceByKey(
// merge partition level clean stats below
(Function2<PartitionCleanStat, PartitionCleanStat, PartitionCleanStat>) (e1, e2) -> e1
.merge(e2)).collect();
Map<String, PartitionCleanStat> partitionCleanStatsMap = partitionCleanStats.stream()
.collect(Collectors.toMap(e -> e._1(), e -> e._2()));
HoodieCleanHelper cleaner = new HoodieCleanHelper(this, config);
// Return PartitionCleanStat for each partition passed.
return partitionsToClean.stream().map(partitionPath -> {
PartitionCleanStat partitionCleanStat =
(partitionCleanStatsMap.containsKey(partitionPath)) ? partitionCleanStatsMap
.get(partitionPath) : new PartitionCleanStat(partitionPath);
return HoodieCleanStat.newBuilder().withPolicy(config.getCleanerPolicy())
.withPartitionPath(partitionPath)
.withEarliestCommitRetained(cleaner.getEarliestCommitToRetain())
.withDeletePathPattern(partitionCleanStat.deletePathPatterns)
.withSuccessfulDeletes(partitionCleanStat.successDeleteFiles)
.withFailedDeletes(partitionCleanStat.failedDeleteFiles).build();
}).collect(Collectors.toList());
}
enum BucketType {
UPDATE,
INSERT
UPDATE, INSERT
}
private static class PartitionCleanStat implements Serializable {
private final String partitionPath;
private final List<String> deletePathPatterns = new ArrayList<>();
private final List<String> successDeleteFiles = new ArrayList<>();
private final List<String> failedDeleteFiles = new ArrayList<>();
private PartitionCleanStat(String partitionPath) {
this.partitionPath = partitionPath;
}
private void addDeletedFileResult(String deletePathStr, Boolean deletedFileResult) {
if (deletedFileResult) {
successDeleteFiles.add(deletePathStr);
} else {
failedDeleteFiles.add(deletePathStr);
}
}
private void addDeleteFilePatterns(String deletePathStr) {
deletePathPatterns.add(deletePathStr);
}
private PartitionCleanStat merge(PartitionCleanStat other) {
if (!this.partitionPath.equals(other.partitionPath)) {
throw new RuntimeException(String
.format("partitionPath is not a match: (%s, %s)", partitionPath, other.partitionPath));
}
successDeleteFiles.addAll(other.successDeleteFiles);
deletePathPatterns.addAll(other.deletePathPatterns);
failedDeleteFiles.addAll(other.failedDeleteFiles);
return this;
}
}
/**
@@ -150,45 +552,37 @@ public class HoodieCopyOnWriteTable<T extends HoodieRecordPayload> extends Hoodi
}
}
/**
* Packs incoming records to be upserted, into buckets (1 bucket = 1 RDD partition)
*/
class UpsertPartitioner extends Partitioner {
/**
* List of all small files to be corrected
*/
List<SmallFile> smallFiles = new ArrayList<SmallFile>();
/**
* Total number of RDD partitions, is determined by total buckets we want to pack the incoming
* workload into
*/
private int totalBuckets = 0;
/**
* Stat for the current workload. Helps in determining total inserts, upserts etc.
*/
private WorkloadStat globalStat;
/**
* Helps decide which bucket an incoming update should go to.
*/
private HashMap<String, Integer> updateLocationToBucket;
/**
* Helps us pack inserts into 1 or more buckets depending on number of incoming records.
*/
private HashMap<String, List<InsertBucket>> partitionPathToInsertBuckets;
/**
* Remembers what type each bucket is for later.
*/
private HashMap<Integer, BucketInfo> bucketInfoMap;
/**
* List of all small files to be corrected
*/
List<SmallFile> smallFiles = new ArrayList<SmallFile>();
UpsertPartitioner(WorkloadProfile profile) {
updateLocationToBucket = new HashMap<>();
partitionPathToInsertBuckets = new HashMap<>();
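
Put together, the partitioner described by the field comments above routes each record by its location: an update goes to the bucket already assigned to the file it lives in, while an insert is spread over one or more insert buckets for its partition path. A toy version of that routing, with the record location simplified to a nullable fileId (the real partitioner also weighs buckets and folds in small files):

import org.apache.spark.Partitioner;

import java.util.HashMap;
import java.util.List;
import java.util.Map;

/** Illustrative only: simplified bucket routing for upserts. */
public class UpsertPartitionerSketch extends Partitioner {
  private final Map<String, Integer> updateFileToBucket = new HashMap<>();
  private final Map<String, List<Integer>> partitionToInsertBuckets = new HashMap<>();
  private final int totalBuckets;

  UpsertPartitionerSketch(Map<String, Integer> updateFileToBucket,
      Map<String, List<Integer>> partitionToInsertBuckets, int totalBuckets) {
    this.updateFileToBucket.putAll(updateFileToBucket);
    this.partitionToInsertBuckets.putAll(partitionToInsertBuckets);
    this.totalBuckets = totalBuckets;
  }

  @Override
  public int numPartitions() {
    return totalBuckets;
  }

  @Override
  public int getPartition(Object key) {
    RecordKey recordKey = (RecordKey) key;
    if (recordKey.currentFileId != null) {
      // Known location: the update must land in the bucket that rewrites that file.
      return updateFileToBucket.get(recordKey.currentFileId);
    }
    // New record: pick one of the insert buckets for its partition path.
    List<Integer> buckets = partitionToInsertBuckets.get(recordKey.partitionPath);
    return buckets.get(Math.floorMod(recordKey.recordKey.hashCode(), buckets.size()));
  }

  static class RecordKey {
    final String recordKey;
    final String partitionPath;
    final String currentFileId; // null when the record is a plain insert

    RecordKey(String recordKey, String partitionPath, String currentFileId) {
      this.recordKey = recordKey;
      this.partitionPath = partitionPath;
      this.currentFileId = currentFileId;
    }
  }
}
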
@@ -198,16 +592,17 @@ public class HoodieCopyOnWriteTable<T extends HoodieRecordPayload> extends Hoodi
assignUpdates(profile);
assignInserts(profile);
logger.info("Total Buckets :" + totalBuckets + ", " +
"buckets info => " + bucketInfoMap + ", \n" +
"Partition to insert buckets => " + partitionPathToInsertBuckets + ", \n" +
"UpdateLocations mapped to buckets =>" + updateLocationToBucket);
logger.info(
"Total Buckets :" + totalBuckets + ", " + "buckets info => " + bucketInfoMap + ", \n"
+ "Partition to insert buckets => " + partitionPathToInsertBuckets + ", \n"
+ "UpdateLocations mapped to buckets =>" + updateLocationToBucket);
}
private void assignUpdates(WorkloadProfile profile) {
// each update location gets a partition
WorkloadStat gStat = profile.getGlobalStat();
for (Map.Entry<String, Pair<String, Long>> updateLocEntry : gStat.getUpdateLocationToCount().entrySet()) {
for (Map.Entry<String, Pair<String, Long>> updateLocEntry : gStat.getUpdateLocationToCount()
.entrySet()) {
addUpdateBucket(updateLocEntry.getKey());
}
}
@@ -270,10 +665,10 @@ public class HoodieCopyOnWriteTable<T extends HoodieRecordPayload> extends Hoodi
}
int insertBuckets = (int) Math.max(totalUnassignedInserts / insertRecordsPerBucket, 1L);
logger
.info("After small file assignment: unassignedInserts => " + totalUnassignedInserts
+ ", totalInsertBuckets => " + insertBuckets
+ ", recordsPerBucket => " + insertRecordsPerBucket);
logger.info(
"After small file assignment: unassignedInserts => " + totalUnassignedInserts
+ ", totalInsertBuckets => " + insertBuckets + ", recordsPerBucket => "
+ insertRecordsPerBucket);
for (int b = 0; b < insertBuckets; b++) {
bucketNumbers.add(totalBuckets);
recordsPerBucket.add(totalUnassignedInserts / insertBuckets);
@@ -339,8 +734,8 @@ public class HoodieCopyOnWriteTable<T extends HoodieRecordPayload> extends Hoodi
*/
private long averageBytesPerRecord() {
long avgSize = 0L;
HoodieTimeline commitTimeline =
metaClient.getActiveTimeline().getCommitTimeline().filterCompletedInstants();
HoodieTimeline commitTimeline = metaClient.getActiveTimeline().getCommitTimeline()
.filterCompletedInstants();
try {
if (!commitTimeline.empty()) {
HoodieInstant latestCommitTime = commitTimeline.lastInstant().get();
@@ -372,7 +767,8 @@ public class HoodieCopyOnWriteTable<T extends HoodieRecordPayload> extends Hoodi
@Override
public int getPartition(Object key) {
Tuple2<HoodieKey, Option<HoodieRecordLocation>> keyLocation = (Tuple2<HoodieKey, Option<HoodieRecordLocation>>) key;
Tuple2<HoodieKey, Option<HoodieRecordLocation>> keyLocation = (Tuple2<HoodieKey,
Option<HoodieRecordLocation>>) key;
if (keyLocation._2().isDefined()) {
HoodieRecordLocation location = keyLocation._2().get();
return updateLocationToBucket.get(location.getFileId());
@@ -396,420 +792,4 @@ public class HoodieCopyOnWriteTable<T extends HoodieRecordPayload> extends Hoodi
}
}
}
@Override
public Partitioner getUpsertPartitioner(WorkloadProfile profile) {
if (profile == null) {
throw new HoodieUpsertException("Need workload profile to construct the upsert partitioner.");
}
return new UpsertPartitioner(profile);
}
@Override
public Partitioner getInsertPartitioner(WorkloadProfile profile) {
return getUpsertPartitioner(profile);
}
@Override
public boolean isWorkloadProfileNeeded() {
return true;
}
@Override
public JavaRDD<WriteStatus> compact(JavaSparkContext jsc, String commitTime) {
throw new HoodieNotSupportedException("Compaction is not supported from a CopyOnWrite table");
}
public Iterator<List<WriteStatus>> handleUpdate(String commitTime, String fileLoc,
Iterator<HoodieRecord<T>> recordItr)
throws IOException {
// these are updates
HoodieMergeHandle upsertHandle = getUpdateHandle(commitTime, fileLoc, recordItr);
return handleUpdateInternal(upsertHandle, commitTime, fileLoc);
}
public Iterator<List<WriteStatus>> handleUpdate(String commitTime, String fileLoc,
Map<String, HoodieRecord<T>> keyToNewRecords)
throws IOException {
// these are updates
HoodieMergeHandle upsertHandle = getUpdateHandle(commitTime, fileLoc, keyToNewRecords);
return handleUpdateInternal(upsertHandle, commitTime, fileLoc);
}
protected Iterator<List<WriteStatus>> handleUpdateInternal(HoodieMergeHandle upsertHandle, String commitTime, String fileLoc)
throws IOException {
if (upsertHandle.getOldFilePath() == null) {
throw new HoodieUpsertException("Error in finding the old file path at commit " +
commitTime + " at fileLoc: " + fileLoc);
} else {
AvroReadSupport.setAvroReadSchema(getHadoopConf(), upsertHandle.getSchema());
ParquetReader<IndexedRecord> reader =
AvroParquetReader.builder(upsertHandle.getOldFilePath()).withConf(getHadoopConf())
.build();
try {
IndexedRecord record;
while ((record = reader.read()) != null) {
// Two types of writes here (new record, and old record).
// We have already caught the exception during writing new records.
// But for old records, we should fail if any exception happens.
upsertHandle.write((GenericRecord) record);
}
} catch (IOException e) {
throw new HoodieUpsertException(
"Failed to read record from " + upsertHandle.getOldFilePath()
+ " with new Schema " + upsertHandle.getSchema(), e);
} finally {
reader.close();
upsertHandle.close();
}
}
//TODO(vc): This needs to be revisited
if (upsertHandle.getWriteStatus().getPartitionPath() == null) {
logger.info("Upsert Handle has partition path as null " + upsertHandle.getOldFilePath()
+ ", " + upsertHandle.getWriteStatus());
}
return Collections.singletonList(Collections.singletonList(upsertHandle.getWriteStatus()))
.iterator();
}
protected HoodieMergeHandle getUpdateHandle(String commitTime, String fileLoc,
Iterator<HoodieRecord<T>> recordItr) {
return new HoodieMergeHandle<>(config, commitTime, this, recordItr, fileLoc);
}
protected HoodieMergeHandle getUpdateHandle(String commitTime, String fileLoc,
Map<String, HoodieRecord<T>> keyToNewRecords) {
return new HoodieMergeHandle<>(config, commitTime, this, keyToNewRecords, fileLoc);
}
public Iterator<List<WriteStatus>> handleInsert(String commitTime,
Iterator<HoodieRecord<T>> recordItr) throws Exception {
return new LazyInsertIterable<>(recordItr, config, commitTime, this);
}
@SuppressWarnings("unchecked")
@Override
public Iterator<List<WriteStatus>> handleUpsertPartition(String commitTime, Integer partition,
Iterator recordItr, Partitioner partitioner) {
UpsertPartitioner upsertPartitioner = (UpsertPartitioner) partitioner;
BucketInfo binfo = upsertPartitioner.getBucketInfo(partition);
BucketType btype = binfo.bucketType;
try {
if (btype.equals(BucketType.INSERT)) {
return handleInsert(commitTime, recordItr);
} else if (btype.equals(BucketType.UPDATE)) {
return handleUpdate(commitTime, binfo.fileLoc, recordItr);
} else {
throw new HoodieUpsertException(
"Unknown bucketType " + btype + " for partition :" + partition);
}
} catch (Throwable t) {
String msg = "Error upserting bucketType " + btype + " for partition :" + partition;
logger.error(msg, t);
throw new HoodieUpsertException(msg, t);
}
}
@Override
public Iterator<List<WriteStatus>> handleInsertPartition(String commitTime, Integer partition,
Iterator recordItr,
Partitioner partitioner) {
return handleUpsertPartition(commitTime, partition, recordItr, partitioner);
}
/**
* Performs cleaning of partition paths according to cleaning policy and returns the number of
* files cleaned. Handles skews in partitions to clean by making files to clean as the unit of
* task distribution.
*
* @throws IllegalArgumentException if unknown cleaning policy is provided
*/
@Override
public List<HoodieCleanStat> clean(JavaSparkContext jsc) {
try {
FileSystem fs = getMetaClient().getFs();
List<String> partitionsToClean =
FSUtils.getAllPartitionPaths(fs, getMetaClient().getBasePath(),
config.shouldAssumeDatePartitioning());
logger.info("Partitions to clean up : " + partitionsToClean + ", with policy " + config
.getCleanerPolicy());
if (partitionsToClean.isEmpty()) {
logger.info("Nothing to clean here mom. It is already clean");
return Collections.emptyList();
}
return cleanPartitionPaths(partitionsToClean, jsc);
} catch (IOException e) {
throw new HoodieIOException("Failed to clean up after commit", e);
}
}
/**
* Common method used for cleaning out parquet files under a partition path during rollback of a
* set of commits
*/
protected Map<FileStatus, Boolean> deleteCleanedFiles(String partitionPath, List<String> commits)
throws IOException {
logger.info("Cleaning path " + partitionPath);
FileSystem fs = getMetaClient().getFs();
FileStatus[] toBeDeleted =
fs.listStatus(new Path(config.getBasePath(), partitionPath), path -> {
if (!path.toString().contains(".parquet")) {
return false;
}
String fileCommitTime = FSUtils.getCommitTime(path.getName());
return commits.contains(fileCommitTime);
});
Map<FileStatus, Boolean> results = Maps.newHashMap();
for (FileStatus file : toBeDeleted) {
boolean success = fs.delete(file.getPath(), false);
results.put(file, success);
logger.info("Delete file " + file.getPath() + "\t" + success);
}
return results;
}
@Override
public List<HoodieRollbackStat> rollback(JavaSparkContext jsc, List<String> commits)
throws IOException {
String actionType = this.getCommitActionType();
HoodieActiveTimeline activeTimeline = this.getActiveTimeline();
List<String> inflights = this.getInflightCommitTimeline().getInstants()
.map(HoodieInstant::getTimestamp)
.collect(Collectors.toList());
// Atomically unpublish all the commits
commits.stream().filter(s -> !inflights.contains(s))
.map(s -> new HoodieInstant(false, actionType, s))
.forEach(activeTimeline::revertToInflight);
logger.info("Unpublished " + commits);
// delete all the data files for all these commits
logger.info("Clean out all parquet files generated for commits: " + commits);
List<HoodieRollbackStat> stats = jsc.parallelize(
FSUtils.getAllPartitionPaths(metaClient.getFs(), getMetaClient().getBasePath(),
config.shouldAssumeDatePartitioning()))
.map((Function<String, HoodieRollbackStat>) partitionPath -> {
// Scan all partitions files with this commit time
Map<FileStatus, Boolean> results = deleteCleanedFiles(partitionPath, commits);
return HoodieRollbackStat.newBuilder().withPartitionPath(partitionPath)
.withDeletedFileResults(results).build();
}).collect();
// clean temporary data files
cleanTemporaryDataFiles(jsc);
// Remove the rolled back inflight commits
commits.stream().map(s -> new HoodieInstant(true, actionType, s))
.forEach(activeTimeline::deleteInflight);
logger.info("Deleted inflight commits " + commits);
return stats;
}
/**
* Finalize the written data files
*
* @param writeStatuses List of WriteStatus
* @return number of files finalized
*/
@Override
@SuppressWarnings("unchecked")
public Optional<Integer> finalizeWrite(JavaSparkContext jsc, List writeStatuses) {
if (!config.shouldUseTempFolderForCopyOnWrite()) {
return Optional.empty();
}
// This is to rename each data file from temporary path to its final location
List<Tuple2<String, Boolean>> results = jsc.parallelize(writeStatuses, config.getFinalizeWriteParallelism())
.map(writeStatus -> {
Tuple2<String, HoodieWriteStat> writeStatTuple2 = (Tuple2<String, HoodieWriteStat>) writeStatus;
HoodieWriteStat writeStat = writeStatTuple2._2();
final FileSystem fs = getMetaClient().getFs();
final Path finalPath = new Path(config.getBasePath(), writeStat.getPath());
if (writeStat.getTempPath() != null) {
final Path tempPath = new Path(config.getBasePath(), writeStat.getTempPath());
boolean success;
try {
logger.info("Renaming temporary file: " + tempPath + " to " + finalPath);
success = fs.rename(tempPath, finalPath);
} catch (IOException e) {
throw new HoodieIOException("Failed to rename file: " + tempPath + " to " + finalPath);
}
if (!success) {
throw new HoodieIOException("Failed to rename file: " + tempPath + " to " + finalPath);
}
}
return new Tuple2<>(writeStat.getPath(), true);
}).collect();
// clean temporary data files
cleanTemporaryDataFiles(jsc);
return Optional.of(results.size());
}
/**
* Clean temporary data files that are produced from previous failed commit or retried spark
* stages.
*/
private void cleanTemporaryDataFiles(JavaSparkContext jsc) {
if (!config.shouldUseTempFolderForCopyOnWrite()) {
return;
}
final FileSystem fs = getMetaClient().getFs();
final Path temporaryFolder = new Path(config.getBasePath(),
HoodieTableMetaClient.TEMPFOLDER_NAME);
try {
if (!fs.exists(temporaryFolder)) {
logger.info("Temporary folder does not exist: " + temporaryFolder);
return;
}
List<FileStatus> fileStatusesList = Arrays.asList(fs.listStatus(temporaryFolder));
List<Tuple2<String, Boolean>> results = jsc
.parallelize(fileStatusesList, config.getFinalizeWriteParallelism())
.map(fileStatus -> {
FileSystem fs1 = getMetaClient().getFs();
boolean success = fs1.delete(fileStatus.getPath(), false);
logger.info("Deleting file in temporary folder" + fileStatus.getPath() + "\t"
+ success);
return new Tuple2<>(fileStatus.getPath().toString(), success);
}).collect();
for (Tuple2<String, Boolean> result : results) {
if (!result._2()) {
logger.info("Failed to delete file: " + result._1());
throw new HoodieIOException(
"Failed to delete file in temporary folder: " + result._1());
}
}
} catch (IOException e) {
throw new HoodieIOException(
"Failed to clean data files in temporary folder: " + temporaryFolder);
}
}
private static class PartitionCleanStat implements Serializable {
private final String partitionPath;
private final List<String> deletePathPatterns = new ArrayList<>();
private final List<String> successDeleteFiles = new ArrayList<>();
private final List<String> failedDeleteFiles = new ArrayList<>();
private PartitionCleanStat(String partitionPath) {
this.partitionPath = partitionPath;
}
private void addDeletedFileResult(String deletePathStr, Boolean deletedFileResult) {
if (deletedFileResult) {
successDeleteFiles.add(deletePathStr);
} else {
failedDeleteFiles.add(deletePathStr);
}
}
private void addDeleteFilePatterns(String deletePathStr) {
deletePathPatterns.add(deletePathStr);
}
private PartitionCleanStat merge(PartitionCleanStat other) {
if (!this.partitionPath.equals(other.partitionPath)) {
throw new RuntimeException(String.format(
"partitionPath is not a match: (%s, %s)",
partitionPath, other.partitionPath));
}
successDeleteFiles.addAll(other.successDeleteFiles);
deletePathPatterns.addAll(other.deletePathPatterns);
failedDeleteFiles.addAll(other.failedDeleteFiles);
return this;
}
}
private List<HoodieCleanStat> cleanPartitionPaths(List<String> partitionsToClean,
JavaSparkContext jsc) {
int cleanerParallelism = Math.min(partitionsToClean.size(), config.getCleanerParallelism());
logger.info("Using cleanerParallelism: " + cleanerParallelism);
List<Tuple2<String, PartitionCleanStat>> partitionCleanStats = jsc
.parallelize(partitionsToClean, cleanerParallelism)
.flatMapToPair(getFilesToDeleteFunc(this, config))
.repartition(cleanerParallelism) // repartition to remove skews
.mapPartitionsToPair(deleteFilesFunc(this))
.reduceByKey(
// merge partition level clean stats below
(Function2<PartitionCleanStat, PartitionCleanStat, PartitionCleanStat>) (e1, e2) -> e1
.merge(e2))
.collect();
Map<String, PartitionCleanStat> partitionCleanStatsMap = partitionCleanStats
.stream().collect(Collectors.toMap(e -> e._1(), e -> e._2()));
HoodieCleanHelper cleaner = new HoodieCleanHelper(this, config);
// Return PartitionCleanStat for each partition passed.
return partitionsToClean.stream().map(partitionPath -> {
PartitionCleanStat partitionCleanStat =
(partitionCleanStatsMap.containsKey(partitionPath)) ?
partitionCleanStatsMap.get(partitionPath)
: new PartitionCleanStat(partitionPath);
return HoodieCleanStat.newBuilder()
.withPolicy(config.getCleanerPolicy())
.withPartitionPath(partitionPath)
.withEarliestCommitRetained(cleaner.getEarliestCommitToRetain())
.withDeletePathPattern(partitionCleanStat.deletePathPatterns)
.withSuccessfulDeletes(partitionCleanStat.successDeleteFiles)
.withFailedDeletes(partitionCleanStat.failedDeleteFiles)
.build();
}).collect(Collectors.toList());
}
private static PairFlatMapFunction<Iterator<Tuple2<String, String>>, String, PartitionCleanStat> deleteFilesFunc(
HoodieTable table) {
return (PairFlatMapFunction<Iterator<Tuple2<String, String>>, String, PartitionCleanStat>) iter -> {
Map<String, PartitionCleanStat> partitionCleanStatMap = new HashMap<>();
FileSystem fs = table.getMetaClient().getFs();
while (iter.hasNext()) {
Tuple2<String, String> partitionDelFileTuple = iter.next();
String partitionPath = partitionDelFileTuple._1();
String deletePathStr = partitionDelFileTuple._2();
Boolean deletedFileResult = deleteFileAndGetResult(fs, deletePathStr);
if (!partitionCleanStatMap.containsKey(partitionPath)) {
partitionCleanStatMap.put(partitionPath,
new PartitionCleanStat(partitionPath));
}
PartitionCleanStat partitionCleanStat = partitionCleanStatMap.get(partitionPath);
partitionCleanStat.addDeleteFilePatterns(deletePathStr);
partitionCleanStat.addDeletedFileResult(deletePathStr, deletedFileResult);
}
return partitionCleanStatMap.entrySet().stream()
.map(e -> new Tuple2<>(e.getKey(), e.getValue()))
.collect(Collectors.toList()).iterator();
};
}
private static PairFlatMapFunction<String, String, String> getFilesToDeleteFunc(
HoodieTable table, HoodieWriteConfig config) {
return (PairFlatMapFunction<String, String, String>) partitionPathToClean -> {
HoodieCleanHelper cleaner = new HoodieCleanHelper(table, config);
return cleaner.getDeletePaths(partitionPathToClean).stream()
.map(deleteFile -> new Tuple2<>(partitionPathToClean, deleteFile.toString()))
.iterator();
};
}
private static Boolean deleteFileAndGetResult(FileSystem fs, String deletePathStr)
throws IOException {
Path deletePath = new Path(deletePathStr);
logger.debug("Working on delete path :" + deletePath);
boolean deleteResult = fs.delete(deletePath, false);
if (deleteResult) {
logger.debug("Cleaned file at path :" + deletePath);
}
return deleteResult;
}
}

View File

@@ -62,19 +62,12 @@ import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.api.java.function.Function;
/**
* Implementation of a more real-time read-optimized Hoodie Table where
* <p>
* INSERTS - Same as HoodieCopyOnWriteTable - Produce new files, block aligned to desired size (or)
* Merge with the smallest existing file, to expand it
* </p>
* <p>
* UPDATES - Appends the changes to a rolling log file maintained per file Id. Compaction merges the
* log file into the base file.
* </p>
* <p>
* WARNING - MOR table type does not support nested rollbacks, every rollback must be followed by an
* attempted commit action
* </p>
* Implementation of a more real-time read-optimized Hoodie Table where <p> INSERTS - Same as
* HoodieCopyOnWriteTable - Produce new files, block aligned to desired size (or) Merge with the
* smallest existing file, to expand it </p> <p> UPDATES - Appends the changes to a rolling log file
* maintained per file Id. Compaction merges the log file into the base file. </p> <p> WARNING - MOR
* table type does not support nested rollbacks, every rollback must be followed by an attempted
* commit action </p>
*/
public class HoodieMergeOnReadTable<T extends HoodieRecordPayload> extends
HoodieCopyOnWriteTable<T> {
@@ -88,57 +81,6 @@ public class HoodieMergeOnReadTable<T extends HoodieRecordPayload> extends
super(config, metaClient);
}
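
For merge-on-read the update path forks, as the handleUpdate override further down shows: if the target file was picked up as a small file it is rewritten copy-on-write style, otherwise the changes are appended to that file id's log and left for compaction to merge. A compressed sketch of that decision; Record and the two handler methods are stand-ins, not Hoodie classes:

import java.util.Iterator;
import java.util.Set;

/** Illustrative only: the copy-on-write vs. append-to-log decision for MOR updates. */
public class MergeOnReadUpdateSketch {
  interface Record { String key(); }

  private final Set<String> smallFileIds;

  MergeOnReadUpdateSketch(Set<String> smallFileIds) {
    this.smallFileIds = smallFileIds;
  }

  void handleUpdate(String commitTime, String fileId, Iterator<Record> records) {
    if (smallFileIds.contains(fileId)) {
      // Small parquet file: rewrite it with the updates folded in, exactly as copy-on-write would.
      rewriteDataFile(commitTime, fileId, records);
    } else {
      // Normal case: append a delta block to the rolling log for this file id; compaction merges it later.
      appendToLog(commitTime, fileId, records);
    }
  }

  void rewriteDataFile(String commitTime, String fileId, Iterator<Record> records) { /* stand-in */ }

  void appendToLog(String commitTime, String fileId, Iterator<Record> records) { /* stand-in */ }
}
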
/**
* UpsertPartitioner for MergeOnRead table type, this allows auto correction of small parquet
* files to larger ones without the need for an index in the logFile.
*/
class MergeOnReadUpsertPartitioner extends HoodieCopyOnWriteTable.UpsertPartitioner {
MergeOnReadUpsertPartitioner(WorkloadProfile profile) {
super(profile);
}
@Override
protected List<SmallFile> getSmallFiles(String partitionPath) {
// smallFiles only for partitionPath
List<SmallFile> smallFileLocations = new ArrayList<>();
// Init here since this class (and member variables) might not have been initialized
HoodieTimeline commitTimeline = getCompletedCommitTimeline();
if (!commitTimeline.empty()) {
HoodieInstant latestCommitTime = commitTimeline.lastInstant().get();
// find smallest file in partition and append to it
Optional<FileSlice> smallFileSlice = getRTFileSystemView()
.getLatestFileSlicesBeforeOrOn(partitionPath, latestCommitTime.getTimestamp())
.filter(fileSlice -> fileSlice.getLogFiles().count() < 1 &&
fileSlice.getDataFile().get().getFileSize() < config.getParquetSmallFileLimit())
.sorted((FileSlice left, FileSlice right) ->
left.getDataFile().get().getFileSize() < right.getDataFile().get().getFileSize() ? -1 : 1)
.findFirst();
if(smallFileSlice.isPresent()) {
String filename = smallFileSlice.get().getDataFile().get().getFileName();
SmallFile sf = new SmallFile();
sf.location = new HoodieRecordLocation(FSUtils.getCommitTime(filename),
FSUtils.getFileId(filename));
sf.sizeBytes = smallFileSlice.get().getDataFile().get().getFileSize();
smallFileLocations.add(sf);
// Update the global small files list
smallFiles.add(sf);
}
}
return smallFileLocations;
}
public List<String> getSmallFileIds() {
return (List<String>) smallFiles.stream().map(smallFile -> ((SmallFile) smallFile).location.getFileId())
.collect(Collectors.toList());
}
}
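
getSmallFiles above encodes the auto-correction rule from the Javadoc: a file slice only qualifies when it has no log files yet and its parquet file is under the configured small-file limit, and the smallest such file wins. The same filter-and-pick, sketched over plain value objects instead of FileSlice:

import java.util.Comparator;
import java.util.List;
import java.util.Optional;

/** Illustrative only: pick the smallest data file that has no log files and is below the small-file limit. */
public class SmallFilePickSketch {
  static class Slice {
    final String fileName;
    final long sizeBytes;
    final int logFileCount;

    Slice(String fileName, long sizeBytes, int logFileCount) {
      this.fileName = fileName;
      this.sizeBytes = sizeBytes;
      this.logFileCount = logFileCount;
    }
  }

  static Optional<Slice> pickSmallFile(List<Slice> latestSlices, long smallFileLimitBytes) {
    return latestSlices.stream()
        .filter(slice -> slice.logFileCount < 1 && slice.sizeBytes < smallFileLimitBytes)
        .min(Comparator.comparingLong((Slice slice) -> slice.sizeBytes));
  }
}
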
@Override
public Partitioner getUpsertPartitioner(WorkloadProfile profile) {
if (profile == null) {
@@ -154,11 +96,12 @@ public class HoodieMergeOnReadTable<T extends HoodieRecordPayload> extends
logger.info("Merging updates for commit " + commitTime + " for file " + fileId);
if (mergeOnReadUpsertPartitioner.getSmallFileIds().contains(fileId)) {
logger.info("Small file corrections for updates for commit " + commitTime + " for file " + fileId);
logger.info(
"Small file corrections for updates for commit " + commitTime + " for file " + fileId);
return super.handleUpdate(commitTime, fileId, recordItr);
} else {
HoodieAppendHandle<T> appendHandle =
new HoodieAppendHandle<>(config, commitTime, this, fileId, recordItr);
HoodieAppendHandle<T> appendHandle = new HoodieAppendHandle<>(config, commitTime, this,
fileId, recordItr);
appendHandle.doAppend();
appendHandle.close();
return Collections.singletonList(Collections.singletonList(appendHandle.getWriteStatus()))
@@ -202,11 +145,9 @@ public class HoodieMergeOnReadTable<T extends HoodieRecordPayload> extends
if (commits.size() > 1) {
throw new UnsupportedOperationException("Nested Rollbacks are not supported");
}
Map<String, HoodieInstant> commitsAndCompactions =
this.getActiveTimeline()
Map<String, HoodieInstant> commitsAndCompactions = this.getActiveTimeline()
.getTimelineOfActions(Sets.newHashSet(HoodieActiveTimeline.COMMIT_ACTION,
HoodieActiveTimeline.DELTA_COMMIT_ACTION))
.getInstants()
HoodieActiveTimeline.DELTA_COMMIT_ACTION)).getInstants()
.filter(i -> commits.contains(i.getTimestamp()))
.collect(Collectors.toMap(i -> i.getTimestamp(), i -> i));
@@ -218,9 +159,9 @@ public class HoodieMergeOnReadTable<T extends HoodieRecordPayload> extends
Long startTime = System.currentTimeMillis();
List<HoodieRollbackStat> allRollbackStats = jsc.parallelize
(FSUtils.getAllPartitionPaths(this.metaClient.getFs(),
this.getMetaClient().getBasePath(), config.shouldAssumeDatePartitioning()))
List<HoodieRollbackStat> allRollbackStats = jsc.parallelize(FSUtils
.getAllPartitionPaths(this.metaClient.getFs(), this.getMetaClient().getBasePath(),
config.shouldAssumeDatePartitioning()))
.map((Function<String, List<HoodieRollbackStat>>) partitionPath -> {
return commits.stream().map(commit -> {
HoodieInstant instant = commitsAndCompactions.get(commit);
@@ -228,23 +169,27 @@ public class HoodieMergeOnReadTable<T extends HoodieRecordPayload> extends
switch (instant.getAction()) {
case HoodieTimeline.COMMIT_ACTION:
try {
Map<FileStatus, Boolean> results = super.deleteCleanedFiles(partitionPath, Arrays.asList(commit));
hoodieRollbackStats = HoodieRollbackStat.newBuilder().withPartitionPath(partitionPath)
.withDeletedFileResults(results).build();
Map<FileStatus, Boolean> results = super
.deleteCleanedFiles(partitionPath, Arrays.asList(commit));
hoodieRollbackStats = HoodieRollbackStat.newBuilder()
.withPartitionPath(partitionPath).withDeletedFileResults(results).build();
break;
} catch (IOException io) {
throw new UncheckedIOException("Failed to rollback for commit " + commit, io);
}
case HoodieTimeline.DELTA_COMMIT_ACTION:
try {
HoodieCommitMetadata commitMetadata = HoodieCommitMetadata
.fromBytes(this.getCommitTimeline().getInstantDetails(new HoodieInstant(true, instant.getAction(), instant.getTimestamp())).get());
HoodieCommitMetadata commitMetadata = HoodieCommitMetadata.fromBytes(
this.getCommitTimeline().getInstantDetails(
new HoodieInstant(true, instant.getAction(), instant.getTimestamp()))
.get());
// read commit file and (either append delete blocks or delete file)
Map<FileStatus, Boolean> filesToDeletedStatus = new HashMap<>();
Map<FileStatus, Long> filesToNumBlocksRollback = new HashMap<>();
// we do not know fileIds for inserts (first inserts are parquet files), delete all parquet files for the corresponding failed commit, if present (same as COW)
// we do not know fileIds for inserts (first inserts are parquet files), delete
// all parquet files for the corresponding failed commit, if present (same as COW)
filesToDeletedStatus = super
.deleteCleanedFiles(partitionPath, Arrays.asList(commit));
@@ -252,32 +197,35 @@ public class HoodieMergeOnReadTable<T extends HoodieRecordPayload> extends
if (commitMetadata.getPartitionToWriteStats().containsKey(partitionPath)) {
commitMetadata.getPartitionToWriteStats().get(partitionPath).stream()
.filter(wStat -> {
return wStat != null && wStat.getPrevCommit() != HoodieWriteStat.NULL_COMMIT
return wStat != null
&& wStat.getPrevCommit() != HoodieWriteStat.NULL_COMMIT
&& wStat.getPrevCommit() != null;
})
.forEach(wStat -> {
}).forEach(wStat -> {
HoodieLogFormat.Writer writer = null;
try {
writer = HoodieLogFormat.newWriterBuilder()
.onParentPath(new Path(this.getMetaClient().getBasePath(), partitionPath))
writer = HoodieLogFormat.newWriterBuilder().onParentPath(
new Path(this.getMetaClient().getBasePath(), partitionPath))
.withFileId(wStat.getFileId()).overBaseCommit(wStat.getPrevCommit())
.withFs(this.metaClient.getFs())
.withFileExtension(HoodieLogFile.DELTA_EXTENSION).build();
Long numRollbackBlocks = 0L;
// generate metadata
Map<HoodieLogBlock.HeaderMetadataType, String> header = Maps.newHashMap();
Map<HoodieLogBlock.HeaderMetadataType, String> header =
Maps.newHashMap();
header.put(HoodieLogBlock.HeaderMetadataType.INSTANT_TIME,
metaClient.getActiveTimeline().lastInstant().get().getTimestamp());
header.put(HoodieLogBlock.HeaderMetadataType.TARGET_INSTANT_TIME, commit);
header.put(HoodieLogBlock.HeaderMetadataType.COMMAND_BLOCK_TYPE,
String.valueOf(HoodieCommandBlock.HoodieCommandBlockTypeEnum.ROLLBACK_PREVIOUS_BLOCK.ordinal()));
header.put(HoodieLogBlock.HeaderMetadataType.TARGET_INSTANT_TIME,
commit);
header.put(HoodieLogBlock.HeaderMetadataType.COMMAND_BLOCK_TYPE, String
.valueOf(
HoodieCommandBlock.HoodieCommandBlockTypeEnum
.ROLLBACK_PREVIOUS_BLOCK
.ordinal()));
// if update belongs to an existing log file
writer = writer.appendBlock(new HoodieCommandBlock(
header));
writer = writer.appendBlock(new HoodieCommandBlock(header));
numRollbackBlocks++;
filesToNumBlocksRollback
.put(this.getMetaClient().getFs().getFileStatus(writer.getLogFile().getPath()),
numRollbackBlocks);
filesToNumBlocksRollback.put(this.getMetaClient().getFs()
.getFileStatus(writer.getLogFile().getPath()), numRollbackBlocks);
} catch (IOException | InterruptedException io) {
throw new HoodieRollbackException(
"Failed to rollback for commit " + commit, io);
@@ -289,7 +237,8 @@ public class HoodieMergeOnReadTable<T extends HoodieRecordPayload> extends
}
}
});
hoodieRollbackStats = HoodieRollbackStat.newBuilder().withPartitionPath(partitionPath)
hoodieRollbackStats = HoodieRollbackStat.newBuilder()
.withPartitionPath(partitionPath)
.withDeletedFileResults(filesToDeletedStatus)
.withRollbackBlockAppendResults(filesToNumBlocksRollback).build();
}
@@ -297,17 +246,19 @@ public class HoodieMergeOnReadTable<T extends HoodieRecordPayload> extends
} catch (IOException io) {
throw new UncheckedIOException("Failed to rollback for commit " + commit, io);
}
default:
break;
}
return hoodieRollbackStats;
}).collect(Collectors.toList());
}).flatMap(x -> x.iterator()).filter(x -> x != null).collect();
commitsAndCompactions.entrySet().stream()
.map(entry -> new HoodieInstant(true, entry.getValue().getAction(),
entry.getValue().getTimestamp()))
.forEach(this.getActiveTimeline()::deleteInflight);
commitsAndCompactions.entrySet().stream().map(
entry -> new HoodieInstant(true, entry.getValue().getAction(),
entry.getValue().getTimestamp())).forEach(this.getActiveTimeline()::deleteInflight);
logger.debug("Time(in ms) taken to finish rollback " + (System.currentTimeMillis() - startTime));
logger
.debug("Time(in ms) taken to finish rollback " + (System.currentTimeMillis() - startTime));
return allRollbackStats;
}
@@ -317,4 +268,56 @@ public class HoodieMergeOnReadTable<T extends HoodieRecordPayload> extends
// do nothing for MOR tables
return Optional.empty();
}
/**
* UpsertPartitioner for MergeOnRead table type, this allows auto correction of small parquet
* files to larger ones without the need for an index in the logFile.
*/
class MergeOnReadUpsertPartitioner extends HoodieCopyOnWriteTable.UpsertPartitioner {
MergeOnReadUpsertPartitioner(WorkloadProfile profile) {
super(profile);
}
@Override
protected List<SmallFile> getSmallFiles(String partitionPath) {
// smallFiles only for partitionPath
List<SmallFile> smallFileLocations = new ArrayList<>();
// Init here since this class (and member variables) might not have been initialized
HoodieTimeline commitTimeline = getCompletedCommitTimeline();
if (!commitTimeline.empty()) {
HoodieInstant latestCommitTime = commitTimeline.lastInstant().get();
// find smallest file in partition and append to it
Optional<FileSlice> smallFileSlice = getRTFileSystemView()
.getLatestFileSlicesBeforeOrOn(partitionPath, latestCommitTime.getTimestamp()).filter(
fileSlice -> fileSlice.getLogFiles().count() < 1
&& fileSlice.getDataFile().get().getFileSize() < config
.getParquetSmallFileLimit()).sorted((FileSlice left, FileSlice right) ->
left.getDataFile().get().getFileSize() < right.getDataFile().get().getFileSize()
? -1 : 1).findFirst();
if (smallFileSlice.isPresent()) {
String filename = smallFileSlice.get().getDataFile().get().getFileName();
SmallFile sf = new SmallFile();
sf.location = new HoodieRecordLocation(FSUtils.getCommitTime(filename),
FSUtils.getFileId(filename));
sf.sizeBytes = smallFileSlice.get().getDataFile().get().getFileSize();
smallFileLocations.add(sf);
// Update the global small files list
smallFiles.add(sf);
}
}
return smallFileLocations;
}
public List<String> getSmallFileIds() {
return (List<String>) smallFiles.stream()
.map(smallFile -> ((SmallFile) smallFile).location.getFileId())
.collect(Collectors.toList());
}
}
}
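A minimal usage sketch, not part of this change, showing how the merge-on-read behavior described in the class Javadoc is reached; conf, basePath, tableName and config are assumed to already exist and the imports are the ones this file already uses:
HoodieTableMetaClient metaClient = HoodieTableMetaClient.initTableType(conf, basePath,
    HoodieTableType.MERGE_ON_READ, tableName, HoodieTableConfig.DEFAULT_PAYLOAD_CLASS);
// The table type recorded at init time is what routes writes through HoodieMergeOnReadTable
// instead of HoodieCopyOnWriteTable.
HoodieTable table = HoodieTable.getHoodieTable(metaClient, config);
// Inserts still create or expand parquet files; updates to existing file ids are appended as log
// blocks via HoodieAppendHandle, unless the small-file correction in MergeOnReadUpsertPartitioner applies.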
View File
@@ -60,18 +60,28 @@ public abstract class HoodieTable<T extends HoodieRecordPayload> implements Seri
this.metaClient = metaClient;
}
public static <T extends HoodieRecordPayload> HoodieTable<T> getHoodieTable(
HoodieTableMetaClient metaClient, HoodieWriteConfig config) {
switch (metaClient.getTableType()) {
case COPY_ON_WRITE:
return new HoodieCopyOnWriteTable<>(config, metaClient);
case MERGE_ON_READ:
return new HoodieMergeOnReadTable<>(config, metaClient);
default:
throw new HoodieException("Unsupported table type :" + metaClient.getTableType());
}
}
/**
* Provides a partitioner to perform the upsert operation, based on the workload profile
*/
public abstract Partitioner getUpsertPartitioner(WorkloadProfile profile);
/**
* Provides a partitioner to perform the insert operation, based on the workload profile
*/
public abstract Partitioner getInsertPartitioner(WorkloadProfile profile);
/**
* Return whether this HoodieTable implementation can benefit from workload profiling
*/
@@ -131,7 +141,6 @@ public abstract class HoodieTable<T extends HoodieRecordPayload> implements Seri
return getCommitsTimeline().filterInflights();
}
/**
* Get only the completed (no-inflights) clean timeline
*/
@@ -162,12 +171,12 @@ public abstract class HoodieTable<T extends HoodieRecordPayload> implements Seri
throw new HoodieSavepointException(
"Could not get data files for savepoint " + savepointTime + ". No such savepoint.");
}
HoodieInstant instant =
new HoodieInstant(false, HoodieTimeline.SAVEPOINT_ACTION, savepointTime);
HoodieInstant instant = new HoodieInstant(false, HoodieTimeline.SAVEPOINT_ACTION,
savepointTime);
HoodieSavepointMetadata metadata = null;
try {
metadata = AvroUtils.deserializeHoodieSavepointMetadata(
getActiveTimeline().getInstantDetails(instant).get());
metadata = AvroUtils
.deserializeHoodieSavepointMetadata(getActiveTimeline().getInstantDetails(instant).get());
} catch (IOException e) {
throw new HoodieSavepointException(
"Could not get savepointed data files for savepoint " + savepointTime, e);
@@ -189,7 +198,8 @@ public abstract class HoodieTable<T extends HoodieRecordPayload> implements Seri
return getActiveTimeline().getCommitTimeline();
case MERGE_ON_READ:
// We need to include the parquet files written out in delta commits
// Include commit action to be able to start doing a MOR over a COW dataset - no migration required
// Include commit action to be able to start doing a MOR over a COW dataset - no
// migration required
return getActiveTimeline().getCommitsTimeline();
default:
throw new HoodieException("Unsupported table type :" + metaClient.getTableType());
@@ -219,10 +229,11 @@ public abstract class HoodieTable<T extends HoodieRecordPayload> implements Seri
return HoodieActiveTimeline.COMMIT_ACTION;
case MERGE_ON_READ:
return HoodieActiveTimeline.DELTA_COMMIT_ACTION;
}
default:
throw new HoodieCommitException(
"Could not commit on unknown storage type " + metaClient.getTableType());
}
}
/**
* Perform the ultimate IO for a given upserted (RDD) partition
@@ -236,21 +247,9 @@ public abstract class HoodieTable<T extends HoodieRecordPayload> implements Seri
public abstract Iterator<List<WriteStatus>> handleInsertPartition(String commitTime,
Integer partition, Iterator<HoodieRecord<T>> recordIterator, Partitioner partitioner);
public static <T extends HoodieRecordPayload> HoodieTable<T> getHoodieTable(
HoodieTableMetaClient metaClient, HoodieWriteConfig config) {
switch (metaClient.getTableType()) {
case COPY_ON_WRITE:
return new HoodieCopyOnWriteTable<>(config, metaClient);
case MERGE_ON_READ:
return new HoodieMergeOnReadTable<>(config, metaClient);
default:
throw new HoodieException("Unsupported table type :" + metaClient.getTableType());
}
}
/**
* Run Compaction on the table.
* Compaction arranges the data so that it is optimized for data access
* Run Compaction on the table. Compaction arranges the data so that it is optimized for data
* access
*/
public abstract JavaRDD<WriteStatus> compact(JavaSparkContext jsc, String commitTime);
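A hedged sketch of calling the compaction entry point above, not part of this change; jsc, metaClient, writeConfig and commitTime are assumed:
HoodieTable table = HoodieTable.getHoodieTable(metaClient, writeConfig);
// The concrete table implementation decides how the data is rearranged for faster access.
JavaRDD<WriteStatus> compactionStatuses = table.compact(jsc, commitTime);
List<WriteStatus> results = compactionStatuses.collect(); // inspect for per-file write errors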
View File
@@ -13,6 +13,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.uber.hoodie.table;
import com.uber.hoodie.common.model.HoodieRecord;
View File
@@ -16,7 +16,6 @@
package com.uber.hoodie.table;
import com.uber.hoodie.common.model.HoodieRecord;
import com.uber.hoodie.common.model.HoodieRecordLocation;
import com.uber.hoodie.common.model.HoodieRecordPayload;
@@ -31,7 +30,7 @@ import scala.Tuple2;
/**
* Information about incoming records for upsert/insert obtained either via sampling or
* introspecting the data fully
*
* <p>
* TODO(vc): Think about obtaining this directly from index.tagLocation
*/
public class WorkloadProfile<T extends HoodieRecordPayload> implements Serializable {
@@ -60,11 +59,9 @@ public class WorkloadProfile<T extends HoodieRecordPayload> implements Serializa
private void buildProfile() {
Map<Tuple2<String, Option<HoodieRecordLocation>>, Long> partitionLocationCounts = taggedRecords
.mapToPair(record ->
new Tuple2<>(
.mapToPair(record -> new Tuple2<>(
new Tuple2<>(record.getPartitionPath(), Option.apply(record.getCurrentLocation())),
record))
.countByKey();
record)).countByKey();
for (Map.Entry<Tuple2<String, Option<HoodieRecordLocation>>, Long> e : partitionLocationCounts
.entrySet()) {
View File
@@ -17,10 +17,9 @@
package com.uber.hoodie.table;
import com.uber.hoodie.common.model.HoodieRecordLocation;
import org.apache.commons.lang3.tuple.Pair;
import java.io.Serializable;
import java.util.HashMap;
import org.apache.commons.lang3.tuple.Pair;
/**
* Wraps stats about a single partition path.
View File
@@ -14,7 +14,6 @@
* limitations under the License.
*/
import com.beust.jcommander.JCommander;
import com.beust.jcommander.Parameter;
import com.uber.hoodie.HoodieWriteClient;
@@ -38,24 +37,19 @@ import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
/**
* Driver program that uses the Hoodie client with synthetic workload, and performs basic
* operations. <p>
* Driver program that uses the Hoodie client with synthetic workload, and performs basic operations. <p>
*/
public class HoodieClientExample {
@Parameter(names = {"--table-path", "-p"}, description = "path for Hoodie sample table")
private String tablePath = "file:///tmp/hoodie/sample-table";
@Parameter(names = {"--table-name", "-n"}, description = "table name for Hoodie sample table")
private String tableName = "hoodie_rt";
@Parameter(names = {"--table-type", "-t"}, description = "One of COPY_ON_WRITE or MERGE_ON_READ")
private String tableType = HoodieTableType.COPY_ON_WRITE.name();
private static Logger logger = LogManager.getLogger(HoodieClientExample.class);
@Parameter(names = {"--help", "-h"}, help = true)
public Boolean help = false;
private static Logger logger = LogManager.getLogger(HoodieClientExample.class);
@Parameter(names = {"--table-path", "-p"}, description = "path for Hoodie sample table")
private String tablePath = "file:///tmp/hoodie/sample-table";
@Parameter(names = {"--table-name", "-n"}, description = "table name for Hoodie sample table")
private String tableName = "hoodie_rt";
@Parameter(names = {"--table-type", "-t"}, description = "One of COPY_ON_WRITE or MERGE_ON_READ")
private String tableType = HoodieTableType.COPY_ON_WRITE.name();
public static void main(String[] args) throws Exception {
HoodieClientExample cli = new HoodieClientExample();
@@ -92,10 +86,10 @@ public class HoodieClientExample {
// Create the write client to write some records in
HoodieWriteConfig cfg = HoodieWriteConfig.newBuilder().withPath(tablePath)
.withSchema(HoodieTestDataGenerator.TRIP_EXAMPLE_SCHEMA).withParallelism(2, 2)
.forTable(tableName).withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(IndexType.BLOOM).build())
.withCompactionConfig(HoodieCompactionConfig.newBuilder().archiveCommitsWith(2, 3).build())
.build();
.forTable(tableName)
.withIndexConfig(HoodieIndexConfig.newBuilder().withIndexType(IndexType.BLOOM).build())
.withCompactionConfig(
HoodieCompactionConfig.newBuilder().archiveCommitsWith(2, 3).build()).build();
HoodieWriteClient client = new HoodieWriteClient(jsc, cfg);
/**
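A hedged continuation sketch, not part of this change; dataGen is assumed to be a HoodieTestDataGenerator created earlier in this driver:
String newCommitTime = client.startCommit();
List<HoodieRecord> records = dataGen.generateInserts(newCommitTime, 100);
JavaRDD<HoodieRecord> writeRecords = jsc.parallelize(records, 1);
// Write the generated records under the new commit time.
JavaRDD<WriteStatus> statuses = client.upsert(writeRecords, newCommitTime);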
View File
@@ -16,7 +16,6 @@
package com.uber.hoodie;
import static org.junit.Assert.assertEquals;
import com.uber.hoodie.common.HoodieClientTestUtils;
@@ -58,11 +57,11 @@ public class TestMultiFS implements Serializable {
private static MiniDFSCluster dfsCluster;
private static DistributedFileSystem dfs;
private static Logger logger = LogManager.getLogger(TestMultiFS.class);
private static JavaSparkContext jsc;
private static SQLContext sqlContext;
private String tablePath = "file:///tmp/hoodie/sample-table";
private String tableName = "hoodie_rt";
private String tableType = HoodieTableType.COPY_ON_WRITE.name();
private static JavaSparkContext jsc;
private static SQLContext sqlContext;
@BeforeClass
public static void initClass() throws Exception {
@@ -92,7 +91,8 @@ public class TestMultiFS implements Serializable {
hdfsTestService.stop();
dfsCluster.shutdown();
}
// Need to closeAll to clear FileSystem.Cache, required because DFS and LocalFS used in the same JVM
// Need to closeAll to clear FileSystem.Cache, required because DFS and LocalFS used in the
// same JVM
FileSystem.closeAll();
}
@@ -111,8 +111,7 @@ public class TestMultiFS implements Serializable {
HoodieWriteConfig cfg = HoodieWriteConfig.newBuilder().withPath(dfsBasePath)
.withSchema(HoodieTestDataGenerator.TRIP_EXAMPLE_SCHEMA).withParallelism(2, 2)
.forTable(tableName).withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build())
.build();
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build()).build();
HoodieWriteClient hdfsWriteClient = new HoodieWriteClient(jsc, cfg);
// Write generated data to hdfs (only inserts)
@@ -125,10 +124,8 @@ public class TestMultiFS implements Serializable {
// Read from hdfs
FileSystem fs = FSUtils.getFs(dfsBasePath, HoodieTestUtils.getDefaultHadoopConf());
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(fs.getConf(), dfsBasePath);
HoodieTimeline timeline = new HoodieActiveTimeline(metaClient)
.getCommitTimeline();
Dataset<Row> readRecords = HoodieClientTestUtils
.readCommit(dfsBasePath, sqlContext, timeline, readCommitTime);
HoodieTimeline timeline = new HoodieActiveTimeline(metaClient).getCommitTimeline();
Dataset<Row> readRecords = HoodieClientTestUtils.readCommit(dfsBasePath, sqlContext, timeline, readCommitTime);
assertEquals("Should contain 100 records", readRecords.count(), records.size());
// Write to local
@@ -138,8 +135,7 @@ public class TestMultiFS implements Serializable {
HoodieWriteConfig localConfig = HoodieWriteConfig.newBuilder().withPath(tablePath)
.withSchema(HoodieTestDataGenerator.TRIP_EXAMPLE_SCHEMA).withParallelism(2, 2)
.forTable(tableName).withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build())
.build();
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build()).build();
HoodieWriteClient localWriteClient = new HoodieWriteClient(jsc, localConfig);
String writeCommitTime = localWriteClient.startCommit();
@@ -153,8 +149,7 @@ public class TestMultiFS implements Serializable {
fs = FSUtils.getFs(tablePath, HoodieTestUtils.getDefaultHadoopConf());
metaClient = new HoodieTableMetaClient(fs.getConf(), tablePath);
timeline = new HoodieActiveTimeline(metaClient).getCommitTimeline();
Dataset<Row> localReadRecords = HoodieClientTestUtils
.readCommit(tablePath, sqlContext, timeline, writeCommitTime);
Dataset<Row> localReadRecords = HoodieClientTestUtils.readCommit(tablePath, sqlContext, timeline, writeCommitTime);
assertEquals("Should contain 100 records", localReadRecords.count(), localRecords.size());
}
}
View File
@@ -69,8 +69,7 @@ public class HoodieClientTestUtils {
return keys;
}
private static void fakeMetaFile(String basePath, String commitTime, String suffix)
throws IOException {
private static void fakeMetaFile(String basePath, String commitTime, String suffix) throws IOException {
String parentPath = basePath + "/" + HoodieTableMetaClient.METAFOLDER_NAME;
new File(parentPath).mkdirs();
new File(parentPath + "/" + commitTime + suffix).createNewFile();
@@ -85,55 +84,48 @@ public class HoodieClientTestUtils {
fakeMetaFile(basePath, commitTime, HoodieTimeline.INFLIGHT_EXTENSION);
}
public static void fakeDataFile(String basePath, String partitionPath, String commitTime,
String fileId) throws Exception {
public static void fakeDataFile(String basePath, String partitionPath, String commitTime, String fileId)
throws Exception {
fakeDataFile(basePath, partitionPath, commitTime, fileId, 0);
}
public static void fakeDataFile(String basePath, String partitionPath, String commitTime,
String fileId, long length) throws Exception {
public static void fakeDataFile(String basePath, String partitionPath, String commitTime, String fileId, long length)
throws Exception {
String parentPath = String.format("%s/%s", basePath, partitionPath);
new File(parentPath).mkdirs();
String path = String
.format("%s/%s", parentPath, FSUtils.makeDataFileName(commitTime, 0, fileId));
String path = String.format("%s/%s", parentPath, FSUtils.makeDataFileName(commitTime, 0, fileId));
new File(path).createNewFile();
new RandomAccessFile(path, "rw").setLength(length);
}
public static SparkConf getSparkConfForTest(String appName) {
SparkConf sparkConf = new SparkConf()
.setAppName(appName)
SparkConf sparkConf = new SparkConf().setAppName(appName)
.set("spark.serializer", "org.apache.spark.serializer.KryoSerializer")
.setMaster("local[1]");
return HoodieReadClient.addHoodieSupport(sparkConf);
}
public static HashMap<String, String> getLatestFileIDsToFullPath(String basePath,
HoodieTimeline commitTimeline,
public static HashMap<String, String> getLatestFileIDsToFullPath(String basePath, HoodieTimeline commitTimeline,
List<HoodieInstant> commitsToReturn) throws IOException {
HashMap<String, String> fileIdToFullPath = new HashMap<>();
for (HoodieInstant commit : commitsToReturn) {
HoodieCommitMetadata metadata =
HoodieCommitMetadata.fromBytes(commitTimeline.getInstantDetails(commit).get());
HoodieCommitMetadata metadata = HoodieCommitMetadata.fromBytes(commitTimeline.getInstantDetails(commit).get());
fileIdToFullPath.putAll(metadata.getFileIdAndFullPaths(basePath));
}
return fileIdToFullPath;
}
public static Dataset<Row> readCommit(String basePath,
SQLContext sqlContext,
HoodieTimeline commitTimeline,
public static Dataset<Row> readCommit(String basePath, SQLContext sqlContext, HoodieTimeline commitTimeline,
String commitTime) {
HoodieInstant commitInstant =
new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime);
HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime);
if (!commitTimeline.containsInstant(commitInstant)) {
new HoodieException("No commit exists at " + commitTime);
}
try {
HashMap<String, String> paths = getLatestFileIDsToFullPath(basePath, commitTimeline,
Arrays.asList(commitInstant));
return sqlContext.read()
.parquet(paths.values().toArray(new String[paths.size()]))
return sqlContext.read().parquet(paths.values().toArray(new String[paths.size()]))
.filter(String.format("%s ='%s'", HoodieRecord.COMMIT_TIME_METADATA_FIELD, commitTime));
} catch (Exception e) {
throw new HoodieException("Error reading commit " + commitTime, e);
@@ -143,50 +135,37 @@ public class HoodieClientTestUtils {
/**
* Obtain all new data written into the Hoodie dataset since the given timestamp.
*/
public static Dataset<Row> readSince(String basePath,
SQLContext sqlContext,
HoodieTimeline commitTimeline,
public static Dataset<Row> readSince(String basePath, SQLContext sqlContext, HoodieTimeline commitTimeline,
String lastCommitTime) {
List<HoodieInstant> commitsToReturn =
commitTimeline.findInstantsAfter(lastCommitTime, Integer.MAX_VALUE)
List<HoodieInstant> commitsToReturn = commitTimeline.findInstantsAfter(lastCommitTime, Integer.MAX_VALUE)
.getInstants().collect(Collectors.toList());
try {
// Go over the commit metadata, and obtain the new files that need to be read.
HashMap<String, String> fileIdToFullPath = getLatestFileIDsToFullPath(basePath,
commitTimeline, commitsToReturn);
return sqlContext.read()
.parquet(fileIdToFullPath.values().toArray(new String[fileIdToFullPath.size()]))
.filter(
String.format("%s >'%s'", HoodieRecord.COMMIT_TIME_METADATA_FIELD, lastCommitTime));
HashMap<String, String> fileIdToFullPath = getLatestFileIDsToFullPath(basePath, commitTimeline, commitsToReturn);
return sqlContext.read().parquet(fileIdToFullPath.values().toArray(new String[fileIdToFullPath.size()]))
.filter(String.format("%s >'%s'", HoodieRecord.COMMIT_TIME_METADATA_FIELD, lastCommitTime));
} catch (IOException e) {
throw new HoodieException(
"Error pulling data incrementally from commitTimestamp :" + lastCommitTime, e);
throw new HoodieException("Error pulling data incrementally from commitTimestamp :" + lastCommitTime, e);
}
}
/**
* Reads the paths under a hoodie dataset out as a DataFrame
*/
public static Dataset<Row> read(String basePath,
SQLContext sqlContext,
FileSystem fs,
String... paths) {
public static Dataset<Row> read(String basePath, SQLContext sqlContext, FileSystem fs, String... paths) {
List<String> filteredPaths = new ArrayList<>();
try {
HoodieTable hoodieTable = HoodieTable
.getHoodieTable(new HoodieTableMetaClient(fs.getConf(), basePath, true), null);
for (String path : paths) {
TableFileSystemView.ReadOptimizedView fileSystemView = new HoodieTableFileSystemView(
hoodieTable.getMetaClient(),
hoodieTable.getCompletedCommitTimeline(), fs.globStatus(new Path(path)));
List<HoodieDataFile> latestFiles = fileSystemView.getLatestDataFiles().collect(
Collectors.toList());
hoodieTable.getMetaClient(), hoodieTable.getCompletedCommitTimeline(), fs.globStatus(new Path(path)));
List<HoodieDataFile> latestFiles = fileSystemView.getLatestDataFiles().collect(Collectors.toList());
for (HoodieDataFile file : latestFiles) {
filteredPaths.add(file.getPath());
}
}
return sqlContext.read()
.parquet(filteredPaths.toArray(new String[filteredPaths.size()]));
return sqlContext.read().parquet(filteredPaths.toArray(new String[filteredPaths.size()]));
} catch (Exception e) {
throw new HoodieException("Error reading hoodie dataset as a dataframe", e);
}
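A hedged sketch of how these read helpers are typically driven from tests, not part of this change; basePath, sqlContext, metaClient and commitTime are assumed:
HoodieTimeline timeline = new HoodieActiveTimeline(metaClient).getCommitTimeline();
// Read exactly the files written by one commit ...
Dataset<Row> oneCommit = HoodieClientTestUtils.readCommit(basePath, sqlContext, timeline, commitTime);
// ... or everything written after it (incremental pull).
Dataset<Row> newData = HoodieClientTestUtils.readSince(basePath, sqlContext, timeline, commitTime);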
View File
@@ -42,8 +42,7 @@ import org.apache.hadoop.mapred.RecordReader;
*/
public class HoodieMergeOnReadTestUtils {
public static List<GenericRecord> getRecordsUsingInputFormat(List<String> inputPaths,
String basePath)
public static List<GenericRecord> getRecordsUsingInputFormat(List<String> inputPaths, String basePath)
throws IOException {
JobConf jobConf = new JobConf();
Schema schema = HoodieAvroUtils.addMetadataFields(Schema.parse(TRIP_EXAMPLE_SCHEMA));
@@ -59,7 +58,8 @@ public class HoodieMergeOnReadTestUtils {
ArrayWritable writable = (ArrayWritable) recordReader.createValue();
while (recordReader.next(key, writable)) {
GenericRecordBuilder newRecord = new GenericRecordBuilder(schema);
// writable returns an array with [field1, field2, _hoodie_commit_time, _hoodie_commit_seqno]
// writable returns an array with [field1, field2, _hoodie_commit_time,
// _hoodie_commit_seqno]
Writable[] values = writable.get();
schema.getFields().forEach(field -> {
newRecord.set(field, values[2]);
@@ -76,12 +76,11 @@ public class HoodieMergeOnReadTestUtils {
}).get();
}
private static void setPropsForInputFormat(HoodieRealtimeInputFormat inputFormat, JobConf jobConf,
Schema schema, String basePath) {
private static void setPropsForInputFormat(HoodieRealtimeInputFormat inputFormat, JobConf jobConf, Schema schema,
String basePath) {
List<Schema.Field> fields = schema.getFields();
String names = fields.stream().map(f -> f.name().toString()).collect(Collectors.joining(","));
String postions = fields.stream().map(f -> String.valueOf(f.pos()))
.collect(Collectors.joining(","));
String postions = fields.stream().map(f -> String.valueOf(f.pos())).collect(Collectors.joining(","));
Configuration conf = HoodieTestUtils.getDefaultHadoopConf();
jobConf.set(ColumnProjectionUtils.READ_COLUMN_NAMES_CONF_STR, names);
jobConf.set(ColumnProjectionUtils.READ_COLUMN_IDS_CONF_STR, postions);
View File
@@ -41,20 +41,15 @@ import org.apache.hadoop.fs.Path;
/**
* Class to be used in tests to keep generating test inserts and updates against a corpus.
*
* <p>
* Test data uses a toy Uber trips data model.
*/
public class HoodieTestDataGenerator {
static class KeyPartition {
HoodieKey key;
String partitionPath;
}
public static String TRIP_EXAMPLE_SCHEMA = "{\"type\": \"record\","
+ "\"name\": \"triprec\","
+ "\"fields\": [ "
// based on examination of sample file, the schema produces the following per record size
public static final int SIZE_PER_RECORD = 50 * 1024;
public static final String[] DEFAULT_PARTITION_PATHS = {"2016/03/15", "2015/03/16", "2015/03/17"};
public static String TRIP_EXAMPLE_SCHEMA = "{\"type\": \"record\"," + "\"name\": \"triprec\"," + "\"fields\": [ "
+ "{\"name\": \"timestamp\",\"type\": \"double\"},"
+ "{\"name\": \"_row_key\", \"type\": \"string\"},"
+ "{\"name\": \"rider\", \"type\": \"string\"},"
@@ -64,25 +59,9 @@ public class HoodieTestDataGenerator {
+ "{\"name\": \"end_lat\", \"type\": \"double\"},"
+ "{\"name\": \"end_lon\", \"type\": \"double\"},"
+ "{\"name\":\"fare\",\"type\": \"double\"}]}";
// based on examination of sample file, the schema produces the following per record size
public static final int SIZE_PER_RECORD = 50 * 1024;
public static final String[] DEFAULT_PARTITION_PATHS = {"2016/03/15", "2015/03/16", "2015/03/17"};
public static void writePartitionMetadata(FileSystem fs, String[] partitionPaths,
String basePath) {
for (String partitionPath : partitionPaths) {
new HoodiePartitionMetadata(fs, "000", new Path(basePath), new Path(basePath, partitionPath))
.trySave(0);
}
}
private List<KeyPartition> existingKeysList = new ArrayList<>();
public static Schema avroSchema = HoodieAvroUtils
.addMetadataFields(new Schema.Parser().parse(TRIP_EXAMPLE_SCHEMA));
public static Schema avroSchema = HoodieAvroUtils.addMetadataFields(new Schema.Parser().parse(TRIP_EXAMPLE_SCHEMA));
private static Random rand = new Random(46474747);
private List<KeyPartition> existingKeysList = new ArrayList<>();
private String[] partitionPaths = DEFAULT_PARTITION_PATHS;
public HoodieTestDataGenerator(String[] partitionPaths) {
@@ -93,10 +72,66 @@ public class HoodieTestDataGenerator {
this(new String[] {"2016/03/15", "2015/03/16", "2015/03/17"});
}
public static void writePartitionMetadata(FileSystem fs, String[] partitionPaths, String basePath) {
for (String partitionPath : partitionPaths) {
new HoodiePartitionMetadata(fs, "000", new Path(basePath), new Path(basePath, partitionPath)).trySave(0);
}
}
/**
* Generates new inserts, uniformly across the partition paths above. It also updates the list of
* existing keys.
* Generates a new avro record of the above schema format, retaining the key if optionally provided.
*/
public static TestRawTripPayload generateRandomValue(HoodieKey key, String commitTime) throws IOException {
GenericRecord rec = generateGenericRecord(key.getRecordKey(), "rider-" + commitTime, "driver-" + commitTime, 0.0);
HoodieAvroUtils.addCommitMetadataToRecord(rec, commitTime, "-1");
return new TestRawTripPayload(rec.toString(), key.getRecordKey(), key.getPartitionPath(), TRIP_EXAMPLE_SCHEMA);
}
public static GenericRecord generateGenericRecord(String rowKey, String riderName, String driverName,
double timestamp) {
GenericRecord rec = new GenericData.Record(avroSchema);
rec.put("_row_key", rowKey);
rec.put("timestamp", timestamp);
rec.put("rider", riderName);
rec.put("driver", driverName);
rec.put("begin_lat", rand.nextDouble());
rec.put("begin_lon", rand.nextDouble());
rec.put("end_lat", rand.nextDouble());
rec.put("end_lon", rand.nextDouble());
rec.put("fare", rand.nextDouble() * 100);
return rec;
}
public static void createCommitFile(String basePath, String commitTime) throws IOException {
Path commitFile = new Path(
basePath + "/" + HoodieTableMetaClient.METAFOLDER_NAME + "/" + HoodieTimeline.makeCommitFileName(commitTime));
FileSystem fs = FSUtils.getFs(basePath, HoodieTestUtils.getDefaultHadoopConf());
FSDataOutputStream os = fs.create(commitFile, true);
HoodieCommitMetadata commitMetadata = new HoodieCommitMetadata();
try {
// Write empty commit metadata
os.writeBytes(new String(commitMetadata.toJsonString().getBytes(StandardCharsets.UTF_8)));
} finally {
os.close();
}
}
public static void createSavepointFile(String basePath, String commitTime) throws IOException {
Path commitFile = new Path(basePath + "/" + HoodieTableMetaClient.METAFOLDER_NAME
+ "/" + HoodieTimeline.makeSavePointFileName(commitTime));
FileSystem fs = FSUtils.getFs(basePath, HoodieTestUtils.getDefaultHadoopConf());
FSDataOutputStream os = fs.create(commitFile, true);
HoodieCommitMetadata commitMetadata = new HoodieCommitMetadata();
try {
// Write empty commit metadata
os.writeBytes(new String(commitMetadata.toJsonString().getBytes(StandardCharsets.UTF_8)));
} finally {
os.close();
}
}
/**
* Generates new inserts, uniformly across the partition paths above. It also updates the list of existing keys.
*/
public List<HoodieRecord> generateInserts(String commitTime, int n) throws IOException {
List<HoodieRecord> inserts = new ArrayList<>();
@@ -119,8 +154,7 @@ public class HoodieTestDataGenerator {
return generateDeletesFromExistingRecords(inserts);
}
public List<HoodieRecord> generateDeletesFromExistingRecords(List<HoodieRecord> existingRecords)
throws IOException {
public List<HoodieRecord> generateDeletesFromExistingRecords(List<HoodieRecord> existingRecords) throws IOException {
List<HoodieRecord> deletes = new ArrayList<>();
for (HoodieRecord existingRecord : existingRecords) {
HoodieRecord record = generateDeleteRecord(existingRecord);
@@ -132,17 +166,15 @@ public class HoodieTestDataGenerator {
public HoodieRecord generateDeleteRecord(HoodieRecord existingRecord) throws IOException {
HoodieKey key = existingRecord.getKey();
TestRawTripPayload payload = new TestRawTripPayload(Optional.empty(), key.getRecordKey(),
key.getPartitionPath(), null, true);
TestRawTripPayload payload = new TestRawTripPayload(Optional.empty(), key.getRecordKey(), key.getPartitionPath(),
null, true);
return new HoodieRecord(key, payload);
}
public List<HoodieRecord> generateUpdates(String commitTime, List<HoodieRecord> baseRecords)
throws IOException {
public List<HoodieRecord> generateUpdates(String commitTime, List<HoodieRecord> baseRecords) throws IOException {
List<HoodieRecord> updates = new ArrayList<>();
for (HoodieRecord baseRecord : baseRecords) {
HoodieRecord record = new HoodieRecord(baseRecord.getKey(),
generateRandomValue(baseRecord.getKey(), commitTime));
HoodieRecord record = new HoodieRecord(baseRecord.getKey(), generateRandomValue(baseRecord.getKey(), commitTime));
updates.add(record);
}
return updates;
@@ -161,68 +193,13 @@ public class HoodieTestDataGenerator {
return updates;
}
/**
* Generates a new avro record of the above schema format, retaining the key if optionally
* provided.
*/
public static TestRawTripPayload generateRandomValue(HoodieKey key, String commitTime)
throws IOException {
GenericRecord rec = generateGenericRecord(key.getRecordKey(), "rider-" + commitTime,
"driver-" + commitTime, 0.0);
HoodieAvroUtils.addCommitMetadataToRecord(rec, commitTime, "-1");
return new TestRawTripPayload(rec.toString(), key.getRecordKey(), key.getPartitionPath(),
TRIP_EXAMPLE_SCHEMA);
}
public static GenericRecord generateGenericRecord(String rowKey, String riderName,
String driverName, double timestamp) {
GenericRecord rec = new GenericData.Record(avroSchema);
rec.put("_row_key", rowKey);
rec.put("timestamp", timestamp);
rec.put("rider", riderName);
rec.put("driver", driverName);
rec.put("begin_lat", rand.nextDouble());
rec.put("begin_lon", rand.nextDouble());
rec.put("end_lat", rand.nextDouble());
rec.put("end_lon", rand.nextDouble());
rec.put("fare", rand.nextDouble() * 100);
return rec;
}
public static void createCommitFile(String basePath, String commitTime) throws IOException {
Path commitFile =
new Path(basePath + "/" + HoodieTableMetaClient.METAFOLDER_NAME + "/" + HoodieTimeline
.makeCommitFileName(commitTime));
FileSystem fs = FSUtils.getFs(basePath, HoodieTestUtils.getDefaultHadoopConf());
FSDataOutputStream os = fs.create(commitFile, true);
HoodieCommitMetadata commitMetadata = new HoodieCommitMetadata();
try {
// Write empty commit metadata
os.writeBytes(new String(commitMetadata.toJsonString().getBytes(
StandardCharsets.UTF_8)));
} finally {
os.close();
}
}
public static void createSavepointFile(String basePath, String commitTime) throws IOException {
Path commitFile =
new Path(basePath + "/" + HoodieTableMetaClient.METAFOLDER_NAME + "/" + HoodieTimeline
.makeSavePointFileName(commitTime));
FileSystem fs = FSUtils.getFs(basePath, HoodieTestUtils.getDefaultHadoopConf());
FSDataOutputStream os = fs.create(commitFile, true);
HoodieCommitMetadata commitMetadata = new HoodieCommitMetadata();
try {
// Write empty commit metadata
os.writeBytes(new String(commitMetadata.toJsonString().getBytes(
StandardCharsets.UTF_8)));
} finally {
os.close();
}
}
public String[] getPartitionPaths() {
return partitionPaths;
}
static class KeyPartition {
HoodieKey key;
String partitionPath;
}
}
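A hedged sketch of the generator's usual flow inside a test method that declares throws IOException, not part of this change:
HoodieTestDataGenerator dataGen =
    new HoodieTestDataGenerator(HoodieTestDataGenerator.DEFAULT_PARTITION_PATHS);
List<HoodieRecord> inserts = dataGen.generateInserts("001", 100); // also remembers the generated keys
List<HoodieRecord> updates = dataGen.generateUpdates("002", inserts); // same keys, new commit time
List<HoodieRecord> deletes = dataGen.generateDeletesFromExistingRecords(inserts);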
View File
@@ -43,15 +43,15 @@ import org.apache.commons.io.IOUtils;
*/
public class TestRawTripPayload implements HoodieRecordPayload<TestRawTripPayload> {
private transient static final ObjectMapper mapper = new ObjectMapper();
private static final transient ObjectMapper mapper = new ObjectMapper();
private String partitionPath;
private String rowKey;
private byte[] jsonDataCompressed;
private int dataSize;
private boolean isDeleted;
public TestRawTripPayload(Optional<String> jsonData, String rowKey, String partitionPath,
String schemaStr, Boolean isDeleted) throws IOException {
public TestRawTripPayload(Optional<String> jsonData, String rowKey, String partitionPath, String schemaStr,
Boolean isDeleted) throws IOException {
if (jsonData.isPresent()) {
this.jsonDataCompressed = compressData(jsonData.get());
this.dataSize = jsonData.get().length();
@@ -61,8 +61,7 @@ public class TestRawTripPayload implements HoodieRecordPayload<TestRawTripPayloa
this.isDeleted = isDeleted;
}
public TestRawTripPayload(String jsonData, String rowKey, String partitionPath,
String schemaStr) throws IOException {
public TestRawTripPayload(String jsonData, String rowKey, String partitionPath, String schemaStr) throws IOException {
this(Optional.of(jsonData), rowKey, partitionPath, schemaStr, false);
}
@@ -86,8 +85,7 @@ public class TestRawTripPayload implements HoodieRecordPayload<TestRawTripPayloa
}
@Override
public Optional<IndexedRecord> combineAndGetUpdateValue(IndexedRecord oldRec, Schema schema)
throws IOException {
public Optional<IndexedRecord> combineAndGetUpdateValue(IndexedRecord oldRec, Schema schema) throws IOException {
return this.getInsertValue(schema);
}
@@ -120,8 +118,7 @@ public class TestRawTripPayload implements HoodieRecordPayload<TestRawTripPayloa
private byte[] compressData(String jsonData) throws IOException {
ByteArrayOutputStream baos = new ByteArrayOutputStream();
DeflaterOutputStream dos =
new DeflaterOutputStream(baos, new Deflater(Deflater.BEST_COMPRESSION), true);
DeflaterOutputStream dos = new DeflaterOutputStream(baos, new Deflater(Deflater.BEST_COMPRESSION), true);
try {
dos.write(jsonData.getBytes());
} finally {
@@ -140,13 +137,36 @@ public class TestRawTripPayload implements HoodieRecordPayload<TestRawTripPayloa
}
/**
* A custom {@link WriteStatus} that merges passed metadata key value map to {@code
* WriteStatus.markSuccess()} and {@code WriteStatus.markFailure()}.
* A custom {@link WriteStatus} that merges passed metadata key value map to {@code WriteStatus.markSuccess()} and
* {@code WriteStatus.markFailure()}.
*/
public static class MetadataMergeWriteStatus extends WriteStatus {
private Map<String, String> mergedMetadataMap = new HashMap<>();
public static Map<String, String> mergeMetadataForWriteStatuses(List<WriteStatus> writeStatuses) {
Map<String, String> allWriteStatusMergedMetadataMap = new HashMap<>();
for (WriteStatus writeStatus : writeStatuses) {
MetadataMergeWriteStatus.mergeMetadataMaps(((MetadataMergeWriteStatus) writeStatus).getMergedMetadataMap(),
allWriteStatusMergedMetadataMap);
}
return allWriteStatusMergedMetadataMap;
}
private static void mergeMetadataMaps(Map<String, String> mergeFromMap, Map<String, String> mergeToMap) {
for (Entry<String, String> entry : mergeFromMap.entrySet()) {
String key = entry.getKey();
if (!mergeToMap.containsKey(key)) {
mergeToMap.put(key, "0");
}
mergeToMap.put(key, addStrsAsInt(entry.getValue(), mergeToMap.get(key)));
}
}
private static String addStrsAsInt(String a, String b) {
return String.valueOf(Integer.parseInt(a) + Integer.parseInt(b));
}
@Override
public void markSuccess(HoodieRecord record, Optional<Map<String, String>> recordMetadata) {
super.markSuccess(record, recordMetadata);
@@ -156,43 +176,15 @@ public class TestRawTripPayload implements HoodieRecordPayload<TestRawTripPayloa
}
@Override
public void markFailure(HoodieRecord record, Throwable t,
Optional<Map<String, String>> recordMetadata) {
public void markFailure(HoodieRecord record, Throwable t, Optional<Map<String, String>> recordMetadata) {
super.markFailure(record, t, recordMetadata);
if (recordMetadata.isPresent()) {
mergeMetadataMaps(recordMetadata.get(), mergedMetadataMap);
}
}
public static Map<String, String> mergeMetadataForWriteStatuses(
List<WriteStatus> writeStatuses) {
Map<String, String> allWriteStatusMergedMetadataMap = new HashMap<>();
for (WriteStatus writeStatus : writeStatuses) {
MetadataMergeWriteStatus.mergeMetadataMaps(
((MetadataMergeWriteStatus) writeStatus).getMergedMetadataMap(),
allWriteStatusMergedMetadataMap);
}
return allWriteStatusMergedMetadataMap;
}
private static void mergeMetadataMaps(Map<String, String> mergeFromMap,
Map<String, String> mergeToMap) {
for (Entry<String, String> entry : mergeFromMap.entrySet()) {
String key = entry.getKey();
if (!mergeToMap.containsKey(key)) {
mergeToMap.put(key, "0");
}
mergeToMap
.put(key, addStrsAsInt(entry.getValue(), mergeToMap.get(key)));
}
}
private Map<String, String> getMergedMetadataMap() {
return mergedMetadataMap;
}
private static String addStrsAsInt(String a, String b) {
return String.valueOf(Integer.parseInt(a) + Integer.parseInt(b));
}
}
}
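A hedged sketch of how the metadata-merging write status above gets inspected, not part of this change; writeStatuses is assumed to be the List<WriteStatus> collected after a write:
// Fold the per-record metadata passed to markSuccess/markFailure across all statuses.
Map<String, String> merged =
    TestRawTripPayload.MetadataMergeWriteStatus.mergeMetadataForWriteStatuses(writeStatuses);
// Each value is the string-encoded sum of the counts merged from the individual statuses.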
View File
@@ -49,8 +49,7 @@ public class HoodieWriteConfigTest {
assertEquals(config.getMinCommitsToKeep(), 2);
}
private ByteArrayOutputStream saveParamsIntoOutputStream(Map<String, String> params)
throws IOException {
private ByteArrayOutputStream saveParamsIntoOutputStream(Map<String, String> params) throws IOException {
Properties properties = new Properties();
properties.putAll(params);
ByteArrayOutputStream outStream = new ByteArrayOutputStream();
View File
@@ -16,18 +16,13 @@
package com.uber.hoodie.func;
import static org.mockito.Mockito.mock;
import static org.mockito.Mockito.when;
import com.uber.hoodie.common.HoodieTestDataGenerator;
import com.uber.hoodie.common.model.HoodieRecord;
import com.uber.hoodie.common.table.timeline.HoodieActiveTimeline;
import com.uber.hoodie.exception.HoodieException;
import org.apache.avro.generic.IndexedRecord;
import org.apache.commons.io.FileUtils;
import org.apache.spark.util.SizeEstimator;
import org.junit.After;
import org.junit.Assert;
import org.junit.Before;
import org.junit.Test;
import java.io.IOException;
import java.util.Iterator;
import java.util.List;
@@ -37,9 +32,13 @@ import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.Future;
import java.util.concurrent.Semaphore;
import static org.mockito.Mockito.mock;
import static org.mockito.Mockito.when;
import org.apache.avro.generic.IndexedRecord;
import org.apache.commons.io.FileUtils;
import org.apache.spark.util.SizeEstimator;
import org.junit.After;
import org.junit.Assert;
import org.junit.Before;
import org.junit.Test;
public class TestBufferedIterator {
@@ -60,26 +59,24 @@ public class TestBufferedIterator {
}
}
// Test to ensure that we are reading all records from buffered iterator in the same order without any exceptions.
// Test to ensure that we are reading all records from buffered iterator in the same order
// without any exceptions.
@Test(timeout = 60000)
public void testRecordReading() throws IOException, ExecutionException, InterruptedException {
final int numRecords = 128;
final List<HoodieRecord> hoodieRecords = hoodieTestDataGenerator.generateInserts(commitTime, numRecords);
final BufferedIterator bufferedIterator =
new BufferedIterator(hoodieRecords.iterator(), FileUtils.ONE_KB, HoodieTestDataGenerator.avroSchema);
Future<Boolean> result =
recordReader.submit(
() -> {
final BufferedIterator bufferedIterator = new BufferedIterator(hoodieRecords.iterator(), FileUtils.ONE_KB,
HoodieTestDataGenerator.avroSchema);
Future<Boolean> result = recordReader.submit(() -> {
bufferedIterator.startBuffering();
return true;
}
);
});
final Iterator<HoodieRecord> originalRecordIterator = hoodieRecords.iterator();
int recordsRead = 0;
while (bufferedIterator.hasNext()) {
final HoodieRecord originalRecord = originalRecordIterator.next();
final Optional<IndexedRecord> originalInsertValue =
originalRecord.getData().getInsertValue(HoodieTestDataGenerator.avroSchema);
final Optional<IndexedRecord> originalInsertValue = originalRecord.getData()
.getInsertValue(HoodieTestDataGenerator.avroSchema);
final BufferedIterator.BufferedIteratorPayload payload = bufferedIterator.next();
// Ensure that record ordering is guaranteed.
Assert.assertEquals(originalRecord, payload.record);
@@ -102,15 +99,12 @@ public class TestBufferedIterator {
// maximum number of records to keep in memory.
final int recordLimit = 5;
final long memoryLimitInBytes = recordLimit * SizeEstimator.estimate(hoodieRecords.get(0));
final BufferedIterator bufferedIterator =
new BufferedIterator(hoodieRecords.iterator(), memoryLimitInBytes, HoodieTestDataGenerator.avroSchema);
Future<Boolean> result =
recordReader.submit(
() -> {
final BufferedIterator bufferedIterator = new BufferedIterator(hoodieRecords.iterator(), memoryLimitInBytes,
HoodieTestDataGenerator.avroSchema);
Future<Boolean> result = recordReader.submit(() -> {
bufferedIterator.startBuffering();
return true;
}
);
});
// waiting for permits to expire.
while (!isQueueFull(bufferedIterator.rateLimiter)) {
Thread.sleep(10);
@@ -128,7 +122,8 @@ public class TestBufferedIterator {
while (!isQueueFull(bufferedIterator.rateLimiter)) {
Thread.sleep(10);
}
// No change is expected in rate limit or number of buffered records. We only expect buffering thread to read
// No change is expected in rate limit or number of buffered records. We only expect
// buffering thread to read
// 2 more records into the buffer.
Assert.assertEquals(0, bufferedIterator.rateLimiter.availablePermits());
Assert.assertEquals(recordLimit, bufferedIterator.currentRateLimit);
@@ -136,7 +131,8 @@ public class TestBufferedIterator {
Assert.assertEquals(recordLimit - 1 + 2, bufferedIterator.samplingRecordCounter.get());
}
// Test to ensure that exception in either buffering thread or BufferedIterator-reader thread is propagated to
// Test to ensure that exception in either buffering thread or BufferedIterator-reader thread
// is propagated to
// another thread.
@Test(timeout = 60000)
public void testException() throws IOException, InterruptedException {
@@ -145,17 +141,15 @@ public class TestBufferedIterator {
// buffer memory limit
final long memoryLimitInBytes = 4 * SizeEstimator.estimate(hoodieRecords.get(0));
// first let us throw exception from bufferIterator reader and test that buffering thread stops and throws
// first let us throw exception from bufferIterator reader and test that buffering thread
// stops and throws
// correct exception back.
BufferedIterator bufferedIterator1 =
new BufferedIterator(hoodieRecords.iterator(), memoryLimitInBytes, HoodieTestDataGenerator.avroSchema);
Future<Boolean> result =
recordReader.submit(
() -> {
BufferedIterator bufferedIterator1 = new BufferedIterator(hoodieRecords.iterator(), memoryLimitInBytes,
HoodieTestDataGenerator.avroSchema);
Future<Boolean> result = recordReader.submit(() -> {
bufferedIterator1.startBuffering();
return true;
}
);
});
// waiting for permits to expire.
while (!isQueueFull(bufferedIterator1.rateLimiter)) {
Thread.sleep(10);
@@ -171,21 +165,19 @@ public class TestBufferedIterator {
Assert.assertEquals(e, e1.getCause().getCause());
}
// second let us raise an exception while doing record buffering. this exception should get propagated to
// second let us raise an exception while doing record buffering. this exception should get
// propagated to
// buffered iterator reader.
final RuntimeException expectedException = new RuntimeException("failing record reading");
final Iterator<HoodieRecord> mockHoodieRecordsIterator = mock(Iterator.class);
when(mockHoodieRecordsIterator.hasNext()).thenReturn(true);
when(mockHoodieRecordsIterator.next()).thenThrow(expectedException);
BufferedIterator bufferedIterator2 =
new BufferedIterator(mockHoodieRecordsIterator, memoryLimitInBytes, HoodieTestDataGenerator.avroSchema);
Future<Boolean> result2 =
recordReader.submit(
() -> {
BufferedIterator bufferedIterator2 = new BufferedIterator(mockHoodieRecordsIterator, memoryLimitInBytes,
HoodieTestDataGenerator.avroSchema);
Future<Boolean> result2 = recordReader.submit(() -> {
bufferedIterator2.startBuffering();
return true;
}
);
});
try {
bufferedIterator2.hasNext();
Assert.fail("exception is expected");
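A hedged sketch of the producer/consumer pattern these tests exercise, not part of this change; recordReader is the test's executor service and hoodieRecords a generated record list:
final BufferedIterator bufferedIterator = new BufferedIterator(hoodieRecords.iterator(),
    FileUtils.ONE_KB, HoodieTestDataGenerator.avroSchema);
// One thread fills the bounded buffer ...
Future<Boolean> producer = recordReader.submit(() -> {
  bufferedIterator.startBuffering();
  return true;
});
// ... while the caller drains it in the original record order.
while (bufferedIterator.hasNext()) {
  BufferedIterator.BufferedIteratorPayload payload = bufferedIterator.next();
  // payload.record is the original HoodieRecord, returned in insertion order.
}
producer.get();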
View File
@@ -55,32 +55,24 @@ public class TestUpdateMapFunction {
public void testSchemaEvolutionOnUpdate() throws Exception {
// Create a bunch of records with a old version of schema
HoodieWriteConfig config = makeHoodieClientConfig("/exampleSchema.txt");
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(
HoodieTestUtils.getDefaultHadoopConf(), basePath);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(HoodieTestUtils.getDefaultHadoopConf(), basePath);
HoodieCopyOnWriteTable table = new HoodieCopyOnWriteTable(config, metaClient);
String recordStr1 =
"{\"_row_key\":\"8eb5b87a-1feh-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 =
"{\"_row_key\":\"8eb5b87b-1feu-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 =
"{\"_row_key\":\"8eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr1 = "{\"_row_key\":\"8eb5b87a-1feh-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"8eb5b87b-1feu-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"8eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
List<HoodieRecord> records = new ArrayList<>();
TestRawTripPayload rowChange1 = new TestRawTripPayload(recordStr1);
records.add(
new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()),
rowChange1));
records.add(new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()), rowChange1));
TestRawTripPayload rowChange2 = new TestRawTripPayload(recordStr2);
records.add(
new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()),
rowChange2));
records.add(new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()), rowChange2));
TestRawTripPayload rowChange3 = new TestRawTripPayload(recordStr3);
records.add(
new HoodieRecord(new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()),
rowChange3));
records.add(new HoodieRecord(new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()), rowChange3));
Iterator<List<WriteStatus>> insertResult = table.handleInsert("100", records.iterator());
Path commitFile =
new Path(config.getBasePath() + "/.hoodie/" + HoodieTimeline.makeCommitFileName("100"));
Path commitFile = new Path(config.getBasePath() + "/.hoodie/" + HoodieTimeline.makeCommitFileName("100"));
FSUtils.getFs(basePath, HoodieTestUtils.getDefaultHadoopConf()).create(commitFile);
// Now try an update with an evolved schema
@@ -92,12 +84,11 @@ public class TestUpdateMapFunction {
table = new HoodieCopyOnWriteTable(config, metaClient);
// New content with values for the newly added field
recordStr1 =
"{\"_row_key\":\"8eb5b87a-1feh-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12,\"added_field\":1}";
recordStr1 = "{\"_row_key\":\"8eb5b87a-1feh-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12,\"added_field\":1}";
records = new ArrayList<>();
rowChange1 = new TestRawTripPayload(recordStr1);
HoodieRecord record1 =
new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()),
HoodieRecord record1 = new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()),
rowChange1);
record1.setCurrentLocation(new HoodieRecordLocation("100", fileId));
records.add(record1);
@@ -105,8 +96,8 @@ public class TestUpdateMapFunction {
try {
table.handleUpdate("101", fileId, records.iterator());
} catch (ClassCastException e) {
fail(
"UpdateFunction could not read records written with exampleSchema.txt using the exampleEvolvedSchema.txt");
fail("UpdateFunction could not read records written with exampleSchema.txt using the "
+ "exampleEvolvedSchema.txt");
}
}
View File
@@ -16,6 +16,12 @@
package com.uber.hoodie.index;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertTrue;
import static org.mockito.Matchers.anyObject;
import static org.mockito.Mockito.atMost;
import static org.mockito.Mockito.times;
import com.uber.hoodie.HoodieWriteClient;
import com.uber.hoodie.WriteStatus;
import com.uber.hoodie.common.HoodieTestDataGenerator;
@@ -23,19 +29,16 @@ import com.uber.hoodie.common.model.HoodieRecord;
import com.uber.hoodie.common.model.HoodieTableType;
import com.uber.hoodie.common.table.HoodieTableConfig;
import com.uber.hoodie.common.table.HoodieTableMetaClient;
import com.uber.hoodie.common.table.TableFileSystemView;
import com.uber.hoodie.common.table.view.HoodieTableFileSystemView;
import com.uber.hoodie.common.util.FSUtils;
import com.uber.hoodie.config.HoodieCompactionConfig;
import com.uber.hoodie.config.HoodieIndexConfig;
import com.uber.hoodie.config.HoodieStorageConfig;
import com.uber.hoodie.config.HoodieWriteConfig;
import com.uber.hoodie.index.hbase.HBaseIndex;
import com.uber.hoodie.table.HoodieTable;
import java.io.File;
import java.util.List;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.hbase.HBaseTestingUtility;
import org.apache.hadoop.hbase.TableName;
import org.apache.hadoop.hbase.client.Connection;
@@ -56,37 +59,26 @@ import org.junit.Test;
import org.junit.rules.TemporaryFolder;
import org.junit.runners.MethodSorters;
import org.mockito.Mockito;
import scala.Tuple2;
import java.io.File;
import java.io.IOException;
import java.util.List;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertTrue;
import static org.mockito.Matchers.anyObject;
import static org.mockito.Mockito.atLeast;
import static org.mockito.Mockito.atMost;
import static org.mockito.Mockito.times;
/**
* Note :: HBaseTestingUtility is really flaky with issues where the HbaseMiniCluster fails to shutdown
* across tests, (see one problem here : https://issues.apache.org/jira/browse/HBASE-15835).
* Hence, the need to use MethodSorters.NAME_ASCENDING to make sure the tests run in order. Please alter
* the order of tests running carefully.
* Note :: HBaseTestingUtility is really flaky with issues where the HbaseMiniCluster fails to shutdown across tests,
* (see one problem here : https://issues.apache.org/jira/browse/HBASE-15835). Hence, the need to use
* MethodSorters.NAME_ASCENDING to make sure the tests run in order. Please alter the order of tests running carefully.
*/
@FixMethodOrder(MethodSorters.NAME_ASCENDING)
public class TestHbaseIndex {
private static JavaSparkContext jsc = null;
private String basePath = null;
private transient FileSystem fs;
private static HBaseTestingUtility utility;
private static Configuration hbaseConfig;
private static String tableName = "test_table";
private String basePath = null;
private transient FileSystem fs;
private HoodieTableMetaClient metaClient;
public TestHbaseIndex() throws Exception {
}
@AfterClass
public static void clean() throws Exception {
if (jsc != null) {
@@ -97,6 +89,20 @@ public class TestHbaseIndex {
}
}
@BeforeClass
public static void init() throws Exception {
// Initialize HbaseMiniCluster
utility = new HBaseTestingUtility();
utility.startMiniCluster();
hbaseConfig = utility.getConnection().getConfiguration();
utility.createTable(TableName.valueOf(tableName), Bytes.toBytes("_s"));
// Initialize a local spark env
SparkConf sparkConf = new SparkConf().setAppName("TestHbaseIndex").setMaster("local[1]");
jsc = new JavaSparkContext(sparkConf);
jsc.hadoopConfiguration().addResource(utility.getConfiguration());
}
@After
public void clear() throws Exception {
if (basePath != null) {
@@ -112,25 +118,8 @@ public class TestHbaseIndex {
basePath = folder.getRoot().getAbsolutePath();
// Initialize table
metaClient = HoodieTableMetaClient
.initTableType(utility.getConfiguration(), basePath, HoodieTableType.COPY_ON_WRITE,
tableName, HoodieTableConfig.DEFAULT_PAYLOAD_CLASS);
}
public TestHbaseIndex() throws Exception {
}
@BeforeClass
public static void init() throws Exception {
// Initialize HbaseMiniCluster
utility = new HBaseTestingUtility();
utility.startMiniCluster();
hbaseConfig = utility.getConnection().getConfiguration();
utility.createTable(TableName.valueOf(tableName), Bytes.toBytes("_s"));
// Initialize a local spark env
SparkConf sparkConf = new SparkConf().setAppName("TestHbaseIndex").setMaster("local[1]");
jsc = new JavaSparkContext(sparkConf);
jsc.hadoopConfiguration().addResource(utility.getConfiguration());
.initTableType(utility.getConfiguration(), basePath, HoodieTableType.COPY_ON_WRITE, tableName,
HoodieTableConfig.DEFAULT_PAYLOAD_CLASS);
}
@Test
@@ -156,7 +145,8 @@ public class TestHbaseIndex {
JavaRDD<WriteStatus> writeStatues = writeClient.upsert(writeRecords, newCommitTime);
assertNoWriteErrors(writeStatues.collect());
// Now tagLocation for these records, hbaseIndex should not tag them since it was a failed commit
// Now tagLocation for these records, hbaseIndex should not tag them since it was a failed
// commit
javaRDD = index.tagLocation(writeRecords, hoodieTable);
assert (javaRDD.filter(record -> record.isCurrentLocationKnown()).collect().size() == 0);
@@ -167,8 +157,9 @@ public class TestHbaseIndex {
javaRDD = index.tagLocation(writeRecords, hoodieTable);
assertTrue(javaRDD.filter(record -> record.isCurrentLocationKnown()).collect().size() == 200);
assertTrue(javaRDD.map(record -> record.getKey().getRecordKey()).distinct().count() == 200);
assertTrue(javaRDD.filter(record -> (record.getCurrentLocation() != null
&& record.getCurrentLocation().getCommitTime().equals(newCommitTime))).distinct().count() == 200);
assertTrue(javaRDD.filter(
record -> (record.getCurrentLocation() != null && record.getCurrentLocation().getCommitTime()
.equals(newCommitTime))).distinct().count() == 200);
}
@@ -208,7 +199,8 @@ public class TestHbaseIndex {
// Rollback the last commit
writeClient.rollback(newCommitTime);
// Now tagLocation for these records, hbaseIndex should not tag them since it was a rolled back commit
// Now tagLocation for these records, hbaseIndex should not tag them since it was a rolled
// back commit
javaRDD = index.tagLocation(writeRecords, hoodieTable);
assert (javaRDD.filter(record -> record.isCurrentLocationKnown()).collect().size() == 0);
assert (javaRDD.filter(record -> record.getCurrentLocation() != null).collect().size() == 0);
@@ -302,12 +294,10 @@ public class TestHbaseIndex {
}
private HoodieWriteConfig.Builder getConfigBuilder() {
return HoodieWriteConfig.newBuilder().withPath(basePath)
.withSchema(HoodieTestDataGenerator.TRIP_EXAMPLE_SCHEMA).withParallelism(1, 1)
.withCompactionConfig(
HoodieCompactionConfig.newBuilder().compactionSmallFileSize(1024 * 1024)
.withInlineCompaction(false).build())
.withAutoCommit(false)
return HoodieWriteConfig.newBuilder().withPath(basePath).withSchema(HoodieTestDataGenerator.TRIP_EXAMPLE_SCHEMA)
.withParallelism(1, 1).withCompactionConfig(
HoodieCompactionConfig.newBuilder().compactionSmallFileSize(1024 * 1024).withInlineCompaction(false)
.build()).withAutoCommit(false)
.withStorageConfig(HoodieStorageConfig.newBuilder().limitFileSize(1024 * 1024).build())
.forTable("test-trip-table").withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.HBASE)

View File

@@ -31,16 +31,14 @@ public class TestHoodieIndex {
HoodieWriteConfig.Builder clientConfigBuilder = HoodieWriteConfig.newBuilder();
HoodieIndexConfig.Builder indexConfigBuilder = HoodieIndexConfig.newBuilder();
// Different types
HoodieWriteConfig config = clientConfigBuilder.withPath("")
.withIndexConfig(indexConfigBuilder.withIndexType(HoodieIndex.IndexType.HBASE).build())
.build();
HoodieWriteConfig config = clientConfigBuilder.withPath("").withIndexConfig(
indexConfigBuilder.withIndexType(HoodieIndex.IndexType.HBASE).build()).build();
assertTrue(HoodieIndex.createIndex(config, null) instanceof HBaseIndex);
config = clientConfigBuilder.withPath("").withIndexConfig(
indexConfigBuilder.withIndexType(HoodieIndex.IndexType.INMEMORY).build()).build();
config = clientConfigBuilder.withPath("")
.withIndexConfig(indexConfigBuilder.withIndexType(HoodieIndex.IndexType.INMEMORY).build()).build();
assertTrue(HoodieIndex.createIndex(config, null) instanceof InMemoryHashIndex);
config = clientConfigBuilder.withPath("")
.withIndexConfig(indexConfigBuilder.withIndexType(HoodieIndex.IndexType.BLOOM).build())
.build();
.withIndexConfig(indexConfigBuilder.withIndexType(HoodieIndex.IndexType.BLOOM).build()).build();
assertTrue(HoodieIndex.createIndex(config, null) instanceof HoodieBloomIndex);
}
}

View File

@@ -98,31 +98,33 @@ public class TestHoodieBloomIndex {
@Test
public void testLoadUUIDsInMemory() throws IOException {
// Create one RDD of hoodie record
String recordStr1 = "{\"_row_key\":\"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"3eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr4 = "{\"_row_key\":\"4eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2015-01-31T03:16:41.415Z\",\"number\":32}";
String recordStr1 = "{\"_row_key\":\"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"3eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr4 = "{\"_row_key\":\"4eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2015-01-31T03:16:41.415Z\",\"number\":32}";
TestRawTripPayload rowChange1 = new TestRawTripPayload(recordStr1);
HoodieRecord record1 = new HoodieRecord(
new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()), rowChange1);
HoodieRecord record1 = new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()),
rowChange1);
TestRawTripPayload rowChange2 = new TestRawTripPayload(recordStr2);
HoodieRecord record2 = new HoodieRecord(
new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()), rowChange2);
HoodieRecord record2 = new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()),
rowChange2);
TestRawTripPayload rowChange3 = new TestRawTripPayload(recordStr3);
HoodieRecord record3 = new HoodieRecord(
new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()), rowChange3);
HoodieRecord record3 = new HoodieRecord(new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()),
rowChange3);
TestRawTripPayload rowChange4 = new TestRawTripPayload(recordStr4);
HoodieRecord record4 = new HoodieRecord(
new HoodieKey(rowChange4.getRowKey(), rowChange4.getPartitionPath()), rowChange4);
HoodieRecord record4 = new HoodieRecord(new HoodieKey(rowChange4.getRowKey(), rowChange4.getPartitionPath()),
rowChange4);
JavaRDD<HoodieRecord> recordRDD = jsc
.parallelize(Arrays.asList(record1, record2, record3, record4));
JavaRDD<HoodieRecord> recordRDD = jsc.parallelize(Arrays.asList(record1, record2, record3, record4));
// Load to memory
Map<String, Iterable<String>> map = recordRDD
.mapToPair(record -> new Tuple2<>(record.getPartitionPath(), record.getRecordKey()))
.groupByKey().collectAsMap();
Map<String, Iterable<String>> map = recordRDD.mapToPair(
record -> new Tuple2<>(record.getPartitionPath(), record.getRecordKey())).groupByKey().collectAsMap();
assertEquals(map.size(), 2);
List<String> list1 = Lists.newArrayList(map.get("2016/01/31"));
List<String> list2 = Lists.newArrayList(map.get("2015/01/31"));
@@ -132,44 +134,40 @@ public class TestHoodieBloomIndex {
@Test
public void testLoadInvolvedFiles() throws IOException {
HoodieWriteConfig config = HoodieWriteConfig.newBuilder()
.withPath(basePath)
.build();
HoodieWriteConfig config = HoodieWriteConfig.newBuilder().withPath(basePath).build();
HoodieBloomIndex index = new HoodieBloomIndex(config, jsc);
// Create some partitions, and put some files
// "2016/01/21": 0 file
// "2016/04/01": 1 file (2_0_20160401010101.parquet)
// "2015/03/12": 3 files (1_0_20150312101010.parquet, 3_0_20150312101010.parquet, 4_0_20150312101010.parquet)
// "2015/03/12": 3 files (1_0_20150312101010.parquet, 3_0_20150312101010.parquet,
// 4_0_20150312101010.parquet)
new File(basePath + "/2016/01/21").mkdirs();
new File(basePath + "/2016/04/01").mkdirs();
new File(basePath + "/2015/03/12").mkdirs();
TestRawTripPayload rowChange1 = new TestRawTripPayload(
"{\"_row_key\":\"000\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}");
HoodieRecord record1 = new HoodieRecord(
new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()), rowChange1);
HoodieRecord record1 = new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()),
rowChange1);
TestRawTripPayload rowChange2 = new TestRawTripPayload(
"{\"_row_key\":\"001\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}");
HoodieRecord record2 = new HoodieRecord(
new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()), rowChange2);
HoodieRecord record2 = new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()),
rowChange2);
TestRawTripPayload rowChange3 = new TestRawTripPayload(
"{\"_row_key\":\"002\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}");
HoodieRecord record3 = new HoodieRecord(
new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()), rowChange3);
HoodieRecord record3 = new HoodieRecord(new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()),
rowChange3);
TestRawTripPayload rowChange4 = new TestRawTripPayload(
"{\"_row_key\":\"003\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}");
HoodieRecord record4 = new HoodieRecord(
new HoodieKey(rowChange4.getRowKey(), rowChange4.getPartitionPath()), rowChange4);
HoodieRecord record4 = new HoodieRecord(new HoodieKey(rowChange4.getRowKey(), rowChange4.getPartitionPath()),
rowChange4);
writeParquetFile("2016/04/01", "2_0_20160401010101.parquet", Lists.newArrayList(), schema, null,
writeParquetFile("2016/04/01", "2_0_20160401010101.parquet", Lists.newArrayList(), schema, null, false);
writeParquetFile("2015/03/12", "1_0_20150312101010.parquet", Lists.newArrayList(), schema, null, false);
writeParquetFile("2015/03/12", "3_0_20150312101010.parquet", Arrays.asList(record1), schema, null, false);
writeParquetFile("2015/03/12", "4_0_20150312101010.parquet", Arrays.asList(record2, record3, record4), schema, null,
false);
writeParquetFile("2015/03/12", "1_0_20150312101010.parquet", Lists.newArrayList(), schema, null,
false);
writeParquetFile("2015/03/12", "3_0_20150312101010.parquet", Arrays.asList(record1), schema,
null, false);
writeParquetFile("2015/03/12", "4_0_20150312101010.parquet",
Arrays.asList(record2, record3, record4), schema, null, false);
List<String> partitions = Arrays.asList("2016/01/21", "2016/04/01", "2015/03/12");
HoodieTableMetaClient metadata = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
@@ -198,51 +196,32 @@ public class TestHoodieBloomIndex {
List<Tuple2<String, BloomIndexFileInfo>> expected = Arrays.asList(
new Tuple2<>("2016/04/01", new BloomIndexFileInfo("2_0_20160401010101.parquet")),
new Tuple2<>("2015/03/12", new BloomIndexFileInfo("1_0_20150312101010.parquet")),
new Tuple2<>("2015/03/12",
new BloomIndexFileInfo("3_0_20150312101010.parquet", "000", "000")),
new Tuple2<>("2015/03/12",
new BloomIndexFileInfo("4_0_20150312101010.parquet", "001", "003"))
);
new Tuple2<>("2015/03/12", new BloomIndexFileInfo("3_0_20150312101010.parquet", "000", "000")),
new Tuple2<>("2015/03/12", new BloomIndexFileInfo("4_0_20150312101010.parquet", "001", "003")));
assertEquals(expected, filesList);
}
@Test
public void testRangePruning() {
HoodieWriteConfig config = HoodieWriteConfig.newBuilder()
.withPath(basePath)
.build();
HoodieWriteConfig config = HoodieWriteConfig.newBuilder().withPath(basePath).build();
HoodieBloomIndex index = new HoodieBloomIndex(config, jsc);
final Map<String, List<BloomIndexFileInfo>> partitionToFileIndexInfo = new HashMap<>();
partitionToFileIndexInfo.put("2017/10/22", Arrays.asList(
new BloomIndexFileInfo("f1"),
new BloomIndexFileInfo("f2", "000", "000"),
new BloomIndexFileInfo("f3", "001", "003"),
new BloomIndexFileInfo("f4", "002", "007"),
new BloomIndexFileInfo("f5", "009", "010")
));
partitionToFileIndexInfo.put("2017/10/22", Arrays.asList(new BloomIndexFileInfo("f1"),
new BloomIndexFileInfo("f2", "000", "000"), new BloomIndexFileInfo("f3", "001", "003"),
new BloomIndexFileInfo("f4", "002", "007"), new BloomIndexFileInfo("f5", "009", "010")));
JavaPairRDD<String, String> partitionRecordKeyPairRDD = jsc
.parallelize(Arrays.asList(
new Tuple2<>("2017/10/22", "003"),
new Tuple2<>("2017/10/22", "002"),
new Tuple2<>("2017/10/22", "005"),
new Tuple2<>("2017/10/22", "004")
))
.mapToPair(t -> t);
JavaPairRDD<String, String> partitionRecordKeyPairRDD = jsc.parallelize(Arrays.asList(
new Tuple2<>("2017/10/22", "003"), new Tuple2<>("2017/10/22", "002"), new Tuple2<>("2017/10/22", "005"),
new Tuple2<>("2017/10/22", "004"))).mapToPair(t -> t);
List<Tuple2<String, Tuple2<String, HoodieKey>>> comparisonKeyList = index
.explodeRecordRDDWithFileComparisons(partitionToFileIndexInfo, partitionRecordKeyPairRDD)
.collect();
List<Tuple2<String, Tuple2<String, HoodieKey>>> comparisonKeyList = index.explodeRecordRDDWithFileComparisons(
partitionToFileIndexInfo, partitionRecordKeyPairRDD).collect();
assertEquals(10, comparisonKeyList.size());
Map<String, List<String>> recordKeyToFileComps = comparisonKeyList.stream()
.collect(Collectors.groupingBy(
t -> t._2()._2().getRecordKey(),
Collectors.mapping(t -> t._2()._1().split("#")[0], Collectors.toList()
)
));
Map<String, List<String>> recordKeyToFileComps = comparisonKeyList.stream().collect(Collectors.groupingBy(
t -> t._2()._2().getRecordKey(), Collectors.mapping(t -> t._2()._1().split("#")[0], Collectors.toList())));
assertEquals(4, recordKeyToFileComps.size());
assertEquals(Arrays.asList("f1", "f3", "f4"), recordKeyToFileComps.get("002"));
@@ -252,32 +231,35 @@ public class TestHoodieBloomIndex {
}
@Test
public void testCheckUUIDsAgainstOneFile()
throws IOException, InterruptedException, ClassNotFoundException {
public void testCheckUUIDsAgainstOneFile() throws IOException, InterruptedException, ClassNotFoundException {
// Create some records to use
String recordStr1 = "{\"_row_key\":\"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"3eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr4 = "{\"_row_key\":\"4eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":32}";
String recordStr1 = "{\"_row_key\":\"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"3eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr4 = "{\"_row_key\":\"4eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":32}";
TestRawTripPayload rowChange1 = new TestRawTripPayload(recordStr1);
HoodieRecord record1 = new HoodieRecord(
new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()), rowChange1);
HoodieRecord record1 = new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()),
rowChange1);
TestRawTripPayload rowChange2 = new TestRawTripPayload(recordStr2);
HoodieRecord record2 = new HoodieRecord(
new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()), rowChange2);
HoodieRecord record2 = new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()),
rowChange2);
TestRawTripPayload rowChange3 = new TestRawTripPayload(recordStr3);
HoodieRecord record3 = new HoodieRecord(
new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()), rowChange3);
HoodieRecord record3 = new HoodieRecord(new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()),
rowChange3);
TestRawTripPayload rowChange4 = new TestRawTripPayload(recordStr4);
HoodieRecord record4 = new HoodieRecord(
new HoodieKey(rowChange4.getRowKey(), rowChange4.getPartitionPath()), rowChange4);
HoodieRecord record4 = new HoodieRecord(new HoodieKey(rowChange4.getRowKey(), rowChange4.getPartitionPath()),
rowChange4);
// We write record1, record2 to a parquet file, but the bloom filter contains (record1, record2, record3).
// We write record1, record2 to a parquet file, but the bloom filter contains (record1,
// record2, record3).
BloomFilter filter = new BloomFilter(10000, 0.0000001);
filter.add(record3.getRecordKey());
String filename = writeParquetFile("2016/01/31", Arrays.asList(record1, record2), schema,
filter, true);
String filename = writeParquetFile("2016/01/31", Arrays.asList(record1, record2), schema, filter, true);
// The bloom filter contains 3 records
assertTrue(filter.mightContain(record1.getRecordKey()));
@@ -286,17 +268,16 @@ public class TestHoodieBloomIndex {
assertFalse(filter.mightContain(record4.getRecordKey()));
// Compare with file
List<String> uuids = Arrays.asList(record1.getRecordKey(), record2.getRecordKey(),
record3.getRecordKey(), record4.getRecordKey());
List<String> uuids = Arrays.asList(record1.getRecordKey(), record2.getRecordKey(), record3.getRecordKey(),
record4.getRecordKey());
List<String> results = HoodieBloomIndexCheckFunction
.checkCandidatesAgainstFile(jsc.hadoopConfiguration(), uuids,
List<String> results = HoodieBloomIndexCheckFunction.checkCandidatesAgainstFile(jsc.hadoopConfiguration(), uuids,
new Path(basePath + "/2016/01/31/" + filename));
assertEquals(results.size(), 2);
assertTrue(results.get(0).equals("1eb5b87a-1feh-4edd-87b4-6ec96dc405a0")
|| results.get(1).equals("1eb5b87a-1feh-4edd-87b4-6ec96dc405a0"));
assertTrue(results.get(0).equals("2eb5b87b-1feu-4edd-87b4-6ec96dc405a0")
|| results.get(1).equals("2eb5b87b-1feu-4edd-87b4-6ec96dc405a0"));
assertTrue(results.get(0).equals("1eb5b87a-1feh-4edd-87b4-6ec96dc405a0") || results.get(1).equals(
"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0"));
assertTrue(results.get(0).equals("2eb5b87b-1feu-4edd-87b4-6ec96dc405a0") || results.get(1).equals(
"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0"));
// TODO(vc): Need more coverage on actual filenames
//assertTrue(results.get(0)._2().equals(filename));
//assertTrue(results.get(1)._2().equals(filename));
@@ -317,8 +298,7 @@ public class TestHoodieBloomIndex {
try {
bloomIndex.tagLocation(recordRDD, table);
} catch (IllegalArgumentException e) {
fail(
"EmptyRDD should not result in IllegalArgumentException: Positive number of slices required");
fail("EmptyRDD should not result in IllegalArgumentException: Positive number of slices " + "required");
}
}
@@ -327,24 +307,27 @@ public class TestHoodieBloomIndex {
public void testTagLocation() throws Exception {
// We have some records to be tagged (two different partitions)
String recordStr1 = "{\"_row_key\":\"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"3eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr4 = "{\"_row_key\":\"4eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2015-01-31T03:16:41.415Z\",\"number\":32}";
String recordStr1 = "{\"_row_key\":\"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"3eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr4 = "{\"_row_key\":\"4eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2015-01-31T03:16:41.415Z\",\"number\":32}";
TestRawTripPayload rowChange1 = new TestRawTripPayload(recordStr1);
HoodieRecord record1 = new HoodieRecord(
new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()), rowChange1);
HoodieRecord record1 = new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()),
rowChange1);
TestRawTripPayload rowChange2 = new TestRawTripPayload(recordStr2);
HoodieRecord record2 = new HoodieRecord(
new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()), rowChange2);
HoodieRecord record2 = new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()),
rowChange2);
TestRawTripPayload rowChange3 = new TestRawTripPayload(recordStr3);
HoodieRecord record3 = new HoodieRecord(
new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()), rowChange3);
HoodieRecord record3 = new HoodieRecord(new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()),
rowChange3);
TestRawTripPayload rowChange4 = new TestRawTripPayload(recordStr4);
HoodieRecord record4 = new HoodieRecord(
new HoodieKey(rowChange4.getRowKey(), rowChange4.getPartitionPath()), rowChange4);
JavaRDD<HoodieRecord> recordRDD = jsc
.parallelize(Arrays.asList(record1, record2, record3, record4));
HoodieRecord record4 = new HoodieRecord(new HoodieKey(rowChange4.getRowKey(), rowChange4.getPartitionPath()),
rowChange4);
JavaRDD<HoodieRecord> recordRDD = jsc.parallelize(Arrays.asList(record1, record2, record3, record4));
// Also create the metadata and config
HoodieTableMetaClient metadata = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
@@ -389,10 +372,14 @@ public class TestHoodieBloomIndex {
public void testCheckExists() throws Exception {
// We have some records to be tagged (two different partitions)
String recordStr1 = "{\"_row_key\":\"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"3eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr4 = "{\"_row_key\":\"4eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2015-01-31T03:16:41.415Z\",\"number\":32}";
String recordStr1 = "{\"_row_key\":\"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"3eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr4 = "{\"_row_key\":\"4eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2015-01-31T03:16:41.415Z\",\"number\":32}";
TestRawTripPayload rowChange1 = new TestRawTripPayload(recordStr1);
HoodieKey key1 = new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath());
HoodieRecord record1 = new HoodieRecord(key1, rowChange1);
@@ -414,8 +401,7 @@ public class TestHoodieBloomIndex {
// Let's tag
HoodieBloomIndex bloomIndex = new HoodieBloomIndex(config, jsc);
JavaPairRDD<HoodieKey, Optional<String>> taggedRecordRDD = bloomIndex
.fetchRecordLocation(keysRDD, table);
JavaPairRDD<HoodieKey, Optional<String>> taggedRecordRDD = bloomIndex.fetchRecordLocation(keysRDD, table);
// Should not find any files
for (Tuple2<HoodieKey, Optional<String>> record : taggedRecordRDD.collect()) {
@@ -456,16 +442,18 @@ public class TestHoodieBloomIndex {
@Test
public void testBloomFilterFalseError() throws IOException, InterruptedException {
// We have two hoodie records
String recordStr1 = "{\"_row_key\":\"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr1 = "{\"_row_key\":\"1eb5b87a-1feh-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"2eb5b87b-1feu-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
// We write record1 to a parquet file, using a bloom filter having both records
TestRawTripPayload rowChange1 = new TestRawTripPayload(recordStr1);
HoodieRecord record1 = new HoodieRecord(
new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()), rowChange1);
HoodieRecord record1 = new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()),
rowChange1);
TestRawTripPayload rowChange2 = new TestRawTripPayload(recordStr2);
HoodieRecord record2 = new HoodieRecord(
new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()), rowChange2);
HoodieRecord record2 = new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()),
rowChange2);
BloomFilter filter = new BloomFilter(10000, 0.0000001);
filter.add(record2.getRecordKey());
@@ -492,8 +480,8 @@ public class TestHoodieBloomIndex {
}
}
private String writeParquetFile(String partitionPath, List<HoodieRecord> records, Schema schema,
BloomFilter filter, boolean createCommitTime) throws IOException, InterruptedException {
private String writeParquetFile(String partitionPath, List<HoodieRecord> records, Schema schema, BloomFilter filter,
boolean createCommitTime) throws IOException, InterruptedException {
Thread.sleep(1000);
String commitTime = new SimpleDateFormat("yyyyMMddHHmmss").format(new Date());
String fileId = UUID.randomUUID().toString();
@@ -502,15 +490,14 @@ public class TestHoodieBloomIndex {
return writeParquetFile(partitionPath, filename, records, schema, filter, createCommitTime);
}
private String writeParquetFile(String partitionPath, String filename, List<HoodieRecord> records,
Schema schema,
private String writeParquetFile(String partitionPath, String filename, List<HoodieRecord> records, Schema schema,
BloomFilter filter, boolean createCommitTime) throws IOException {
if (filter == null) {
filter = new BloomFilter(10000, 0.0000001);
}
HoodieAvroWriteSupport writeSupport = new HoodieAvroWriteSupport(
new AvroSchemaConverter().convert(schema), schema, filter);
HoodieAvroWriteSupport writeSupport = new HoodieAvroWriteSupport(new AvroSchemaConverter().convert(schema), schema,
filter);
String commitTime = FSUtils.getCommitTime(filename);
HoodieParquetConfig config = new HoodieParquetConfig(writeSupport, CompressionCodecName.GZIP,
ParquetWriter.DEFAULT_BLOCK_SIZE, ParquetWriter.DEFAULT_PAGE_SIZE, 120 * 1024 * 1024,
@@ -525,9 +512,7 @@ public class TestHoodieBloomIndex {
for (HoodieRecord record : records) {
GenericRecord avroRecord = (GenericRecord) record.getData().getInsertValue(schema).get();
HoodieAvroUtils.addCommitMetadataToRecord(avroRecord, commitTime, "" + seqId++);
HoodieAvroUtils
.addHoodieKeyToRecord(avroRecord, record.getRecordKey(), record.getPartitionPath(),
filename);
HoodieAvroUtils.addHoodieKeyToRecord(avroRecord, record.getRecordKey(), record.getPartitionPath(), filename);
writer.writeAvro(record.getRecordKey(), avroRecord);
filter.add(record.getRecordKey());
}
@@ -536,9 +521,7 @@ public class TestHoodieBloomIndex {
if (createCommitTime) {
// Also make sure the commit is valid
new File(basePath + "/" + HoodieTableMetaClient.METAFOLDER_NAME).mkdirs();
new File(
basePath + "/" + HoodieTableMetaClient.METAFOLDER_NAME + "/" + commitTime + ".commit")
.createNewFile();
new File(basePath + "/" + HoodieTableMetaClient.METAFOLDER_NAME + "/" + commitTime + ".commit").createNewFile();
}
return filename;
}

View File

@@ -77,7 +77,8 @@ public class TestHoodieCommitArchiveLog {
public void testArchiveDatasetWithArchival() throws IOException {
HoodieWriteConfig cfg = HoodieWriteConfig.newBuilder().withPath(basePath)
.withSchema(HoodieTestDataGenerator.TRIP_EXAMPLE_SCHEMA).withParallelism(2, 2)
.withCompactionConfig(HoodieCompactionConfig.newBuilder().archiveCommitsWith(2, 4).build())
.withCompactionConfig(
HoodieCompactionConfig.newBuilder().archiveCommitsWith(2, 4).build())
.forTable("test-trip-table").build();
HoodieTestUtils.init(hadoopConf, basePath);
HoodieTestDataGenerator.createCommitFile(basePath, "100");
@@ -88,8 +89,7 @@ public class TestHoodieCommitArchiveLog {
HoodieTestDataGenerator.createCommitFile(basePath, "105");
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(fs.getConf(), basePath);
HoodieTimeline timeline =
metaClient.getActiveTimeline().getCommitsTimeline().filterCompletedInstants();
HoodieTimeline timeline = metaClient.getActiveTimeline().getCommitsTimeline().filterCompletedInstants();
assertEquals("Loaded 6 commits and the count should match", 6, timeline.countInstants());
@@ -103,8 +103,7 @@ public class TestHoodieCommitArchiveLog {
HoodieTestUtils.createInflightCleanFiles(basePath, "106", "107");
//reload the timeline and get all the commmits before archive
timeline = metaClient.getActiveTimeline().reload().getAllCommitsTimeline()
.filterCompletedInstants();
timeline = metaClient.getActiveTimeline().reload().getAllCommitsTimeline().filterCompletedInstants();
List<HoodieInstant> originalCommits = timeline.getInstants().collect(Collectors.toList());
assertEquals("Loaded 6 commits and the count should match", 12, timeline.countInstants());
@@ -118,13 +117,12 @@ public class TestHoodieCommitArchiveLog {
assertTrue(archiveLog.archiveIfRequired());
//reload the timeline and remove the remaining commits
timeline = metaClient.getActiveTimeline().reload().getAllCommitsTimeline()
.filterCompletedInstants();
timeline = metaClient.getActiveTimeline().reload().getAllCommitsTimeline().filterCompletedInstants();
originalCommits.removeAll(timeline.getInstants().collect(Collectors.toList()));
//read the file
HoodieLogFormat.Reader reader = HoodieLogFormat
.newReader(fs, new HoodieLogFile(new Path(basePath + "/.hoodie/.commits_.archive.1")),
HoodieLogFormat.Reader reader = HoodieLogFormat.newReader(fs,
new HoodieLogFile(new Path(basePath + "/.hoodie/.commits_.archive.1")),
HoodieArchivedMetaEntry.getClassSchema());
int archivedRecordsCount = 0;
@@ -137,8 +135,7 @@ public class TestHoodieCommitArchiveLog {
assertEquals("Archived and read records for each block are same", 8, records.size());
archivedRecordsCount += records.size();
}
assertEquals("Total archived records and total read records are the same count", 8,
archivedRecordsCount);
assertEquals("Total archived records and total read records are the same count", 8, archivedRecordsCount);
//make sure the archived commits are the same as the (originalcommits - commitsleft)
List<String> readCommits = readRecords.stream().map(r -> (GenericRecord) r).map(r -> {
@@ -146,10 +143,8 @@ public class TestHoodieCommitArchiveLog {
}).collect(Collectors.toList());
Collections.sort(readCommits);
assertEquals(
"Read commits map should match the originalCommits - commitsLoadedFromArchival",
originalCommits.stream().map(HoodieInstant::getTimestamp).collect(Collectors.toList()),
readCommits);
assertEquals("Read commits map should match the originalCommits - commitsLoadedFromArchival",
originalCommits.stream().map(HoodieInstant::getTimestamp).collect(Collectors.toList()), readCommits);
// verify in-flight instants after archive
verifyInflightInstants(metaClient, 3);
@@ -168,15 +163,12 @@ public class TestHoodieCommitArchiveLog {
HoodieTestDataGenerator.createCommitFile(basePath, "102");
HoodieTestDataGenerator.createCommitFile(basePath, "103");
HoodieTimeline timeline = metaClient.getActiveTimeline().getCommitsTimeline()
.filterCompletedInstants();
HoodieTimeline timeline = metaClient.getActiveTimeline().getCommitsTimeline().filterCompletedInstants();
assertEquals("Loaded 4 commits and the count should match", 4, timeline.countInstants());
boolean result = archiveLog.archiveIfRequired();
assertTrue(result);
timeline = metaClient.getActiveTimeline().reload().getCommitsTimeline()
.filterCompletedInstants();
assertEquals("Should not archive commits when maxCommitsToKeep is 5", 4,
timeline.countInstants());
timeline = metaClient.getActiveTimeline().reload().getCommitsTimeline().filterCompletedInstants();
assertEquals("Should not archive commits when maxCommitsToKeep is 5", 4, timeline.countInstants());
}
@Test
@@ -194,21 +186,15 @@ public class TestHoodieCommitArchiveLog {
HoodieTestDataGenerator.createCommitFile(basePath, "104");
HoodieTestDataGenerator.createCommitFile(basePath, "105");
HoodieTimeline timeline = metaClient.getActiveTimeline().getCommitsTimeline()
.filterCompletedInstants();
HoodieTimeline timeline = metaClient.getActiveTimeline().getCommitsTimeline().filterCompletedInstants();
assertEquals("Loaded 6 commits and the count should match", 6, timeline.countInstants());
boolean result = archiveLog.archiveIfRequired();
assertTrue(result);
timeline = metaClient.getActiveTimeline().reload().getCommitsTimeline()
.filterCompletedInstants();
assertTrue("Archived commits should always be safe",
timeline.containsOrBeforeTimelineStarts("100"));
assertTrue("Archived commits should always be safe",
timeline.containsOrBeforeTimelineStarts("101"));
assertTrue("Archived commits should always be safe",
timeline.containsOrBeforeTimelineStarts("102"));
assertTrue("Archived commits should always be safe",
timeline.containsOrBeforeTimelineStarts("103"));
timeline = metaClient.getActiveTimeline().reload().getCommitsTimeline().filterCompletedInstants();
assertTrue("Archived commits should always be safe", timeline.containsOrBeforeTimelineStarts("100"));
assertTrue("Archived commits should always be safe", timeline.containsOrBeforeTimelineStarts("101"));
assertTrue("Archived commits should always be safe", timeline.containsOrBeforeTimelineStarts("102"));
assertTrue("Archived commits should always be safe", timeline.containsOrBeforeTimelineStarts("103"));
}
@Test
@@ -227,16 +213,14 @@ public class TestHoodieCommitArchiveLog {
HoodieTestDataGenerator.createCommitFile(basePath, "104");
HoodieTestDataGenerator.createCommitFile(basePath, "105");
HoodieTimeline timeline = metaClient.getActiveTimeline().getCommitsTimeline()
.filterCompletedInstants();
HoodieTimeline timeline = metaClient.getActiveTimeline().getCommitsTimeline().filterCompletedInstants();
assertEquals("Loaded 6 commits and the count should match", 6, timeline.countInstants());
boolean result = archiveLog.archiveIfRequired();
assertTrue(result);
timeline = metaClient.getActiveTimeline().reload().getCommitsTimeline()
.filterCompletedInstants();
timeline = metaClient.getActiveTimeline().reload().getCommitsTimeline().filterCompletedInstants();
assertEquals(
"Since we have a savepoint at 101, we should never archive any commit after 101 (we only archive 100)",
5, timeline.countInstants());
"Since we have a savepoint at 101, we should never archive any commit after 101 (we only " + "archive 100)", 5,
timeline.countInstants());
assertTrue("Archived commits should always be safe",
timeline.containsInstant(new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, "101")));
assertTrue("Archived commits should always be safe",
@@ -248,7 +232,7 @@ public class TestHoodieCommitArchiveLog {
private void verifyInflightInstants(HoodieTableMetaClient metaClient, int expectedTotalInstants) {
HoodieTimeline timeline = metaClient.getActiveTimeline().reload()
.getTimelineOfActions(Sets.newHashSet(HoodieTimeline.CLEAN_ACTION)).filterInflights();
assertEquals("Loaded inflight clean actions and the count should match",
expectedTotalInstants, timeline.countInstants());
assertEquals("Loaded inflight clean actions and the count should match", expectedTotalInstants,
timeline.countInstants());
}
}

View File

@@ -93,32 +93,27 @@ public class TestHoodieCompactor {
}
private HoodieWriteConfig.Builder getConfigBuilder() {
return HoodieWriteConfig.newBuilder().withPath(basePath)
.withSchema(HoodieTestDataGenerator.TRIP_EXAMPLE_SCHEMA).withParallelism(2, 2)
.withCompactionConfig(
HoodieCompactionConfig.newBuilder().compactionSmallFileSize(1024 * 1024)
.withInlineCompaction(false).build())
.withStorageConfig(HoodieStorageConfig.newBuilder().limitFileSize(1024 * 1024).build())
.forTable("test-trip-table").withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build());
return HoodieWriteConfig.newBuilder().withPath(basePath).withSchema(HoodieTestDataGenerator.TRIP_EXAMPLE_SCHEMA)
.withParallelism(2, 2).withCompactionConfig(
HoodieCompactionConfig.newBuilder().compactionSmallFileSize(1024 * 1024).withInlineCompaction(false)
.build()).withStorageConfig(HoodieStorageConfig.newBuilder().limitFileSize(1024 * 1024).build())
.forTable("test-trip-table")
.withIndexConfig(HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build());
}
@Test(expected = IllegalArgumentException.class)
public void testCompactionOnCopyOnWriteFail() throws Exception {
HoodieTestUtils.initTableType(hadoopConf, basePath, HoodieTableType.COPY_ON_WRITE);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(),
basePath);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
HoodieTable table = HoodieTable.getHoodieTable(metaClient, getConfig());
compactor.compact(jsc, getConfig(), table, HoodieActiveTimeline.createNewCommitTime());
}
@Test
public void testCompactionEmpty() throws Exception {
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(),
basePath);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
HoodieWriteConfig config = getConfig();
HoodieTable table = HoodieTable
.getHoodieTable(metaClient, config);
HoodieTable table = HoodieTable.getHoodieTable(metaClient, config);
HoodieWriteClient writeClient = new HoodieWriteClient(jsc, config);
String newCommitTime = writeClient.startCommit();
@@ -126,10 +121,9 @@ public class TestHoodieCompactor {
JavaRDD<HoodieRecord> recordsRDD = jsc.parallelize(records, 1);
writeClient.insert(recordsRDD, newCommitTime).collect();
JavaRDD<WriteStatus> result =
compactor.compact(jsc, getConfig(), table, HoodieActiveTimeline.createNewCommitTime());
assertTrue("If there is nothing to compact, result will be empty",
result.isEmpty());
JavaRDD<WriteStatus> result = compactor
.compact(jsc, getConfig(), table, HoodieActiveTimeline.createNewCommitTime());
assertTrue("If there is nothing to compact, result will be empty", result.isEmpty());
}
@Test
@@ -145,8 +139,7 @@ public class TestHoodieCompactor {
List<WriteStatus> statuses = writeClient.insert(recordsRDD, newCommitTime).collect();
// Update all the 100 records
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(),
basePath);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
HoodieTable table = HoodieTable.getHoodieTable(metaClient, config);
newCommitTime = "101";
@@ -159,19 +152,16 @@ public class TestHoodieCompactor {
// Write them to corresponding avro logfiles
HoodieTestUtils
.writeRecordsToLogFiles(fs, metaClient.getBasePath(), HoodieTestDataGenerator.avroSchema,
updatedRecords);
.writeRecordsToLogFiles(fs, metaClient.getBasePath(), HoodieTestDataGenerator.avroSchema, updatedRecords);
// Verify that all data file has one log file
metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
table = HoodieTable.getHoodieTable(metaClient, config);
for (String partitionPath : dataGen.getPartitionPaths()) {
List<FileSlice> groupedLogFiles =
table.getRTFileSystemView().getLatestFileSlices(partitionPath)
List<FileSlice> groupedLogFiles = table.getRTFileSystemView().getLatestFileSlices(partitionPath)
.collect(Collectors.toList());
for (FileSlice fileSlice : groupedLogFiles) {
assertEquals("There should be 1 log file written for every data file", 1,
fileSlice.getLogFiles().count());
assertEquals("There should be 1 log file written for every data file", 1, fileSlice.getLogFiles().count());
}
}
@@ -179,18 +169,19 @@ public class TestHoodieCompactor {
metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
table = HoodieTable.getHoodieTable(metaClient, config);
JavaRDD<WriteStatus> result =
compactor.compact(jsc, getConfig(), table, HoodieActiveTimeline.createNewCommitTime());
JavaRDD<WriteStatus> result = compactor
.compact(jsc, getConfig(), table, HoodieActiveTimeline.createNewCommitTime());
// Verify that all partition paths are present in the WriteStatus result
for (String partitionPath : dataGen.getPartitionPaths()) {
List<WriteStatus> writeStatuses = result.collect();
assertTrue(writeStatuses.stream()
.filter(writeStatus -> writeStatus.getStat().getPartitionPath()
.contentEquals(partitionPath)).count() > 0);
.filter(writeStatus -> writeStatus.getStat().getPartitionPath().contentEquals(partitionPath))
.count() > 0);
}
}
// TODO - after modifying HoodieReadClient to support realtime tables - add more tests to make sure the data read is the updated data (compaction correctness)
// TODO - after modifying HoodieReadClient to support realtime tables - add more tests to make
// sure the data read is the updated data (compaction correctness)
// TODO - add more test cases for compactions after a failed commit/compaction
}

View File

@@ -16,6 +16,9 @@
package com.uber.hoodie.io.strategy;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertTrue;
import com.beust.jcommander.internal.Lists;
import com.google.common.collect.Maps;
import com.uber.hoodie.config.HoodieCompactionConfig;
@@ -25,15 +28,11 @@ import com.uber.hoodie.io.compact.strategy.BoundedIOCompactionStrategy;
import com.uber.hoodie.io.compact.strategy.DayBasedCompactionStrategy;
import com.uber.hoodie.io.compact.strategy.LogFileSizeBasedCompactionStrategy;
import com.uber.hoodie.io.compact.strategy.UnBoundedCompactionStrategy;
import org.junit.Test;
import java.util.List;
import java.util.Map;
import java.util.Random;
import java.util.stream.Collectors;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertTrue;
import org.junit.Test;
public class TestHoodieCompactionStrategy {
@@ -48,8 +47,7 @@ public class TestHoodieCompactionStrategy {
sizesMap.put(100 * MB, Lists.newArrayList(MB));
sizesMap.put(90 * MB, Lists.newArrayList(1024 * MB));
UnBoundedCompactionStrategy strategy = new UnBoundedCompactionStrategy();
HoodieWriteConfig writeConfig = HoodieWriteConfig.newBuilder().withPath("/tmp")
.withCompactionConfig(
HoodieWriteConfig writeConfig = HoodieWriteConfig.newBuilder().withPath("/tmp").withCompactionConfig(
HoodieCompactionConfig.newBuilder().withCompactionStrategy(strategy).build()).build();
List<CompactionOperation> operations = createCompactionOperations(writeConfig, sizesMap);
List<CompactionOperation> returned = strategy.orderAndFilter(writeConfig, operations);
@@ -64,23 +62,19 @@ public class TestHoodieCompactionStrategy {
sizesMap.put(100 * MB, Lists.newArrayList(MB));
sizesMap.put(90 * MB, Lists.newArrayList(1024 * MB));
BoundedIOCompactionStrategy strategy = new BoundedIOCompactionStrategy();
HoodieWriteConfig writeConfig = HoodieWriteConfig.newBuilder().withPath("/tmp")
.withCompactionConfig(
HoodieCompactionConfig.newBuilder().withCompactionStrategy(strategy)
.withTargetIOPerCompactionInMB(400).build()).build();
HoodieWriteConfig writeConfig = HoodieWriteConfig.newBuilder().withPath("/tmp").withCompactionConfig(
HoodieCompactionConfig.newBuilder().withCompactionStrategy(strategy).withTargetIOPerCompactionInMB(400).build())
.build();
List<CompactionOperation> operations = createCompactionOperations(writeConfig, sizesMap);
List<CompactionOperation> returned = strategy.orderAndFilter(writeConfig, operations);
assertTrue("BoundedIOCompaction should have resulted in fewer compactions",
returned.size() < operations.size());
assertEquals("BoundedIOCompaction should have resulted in 2 compactions being chosen",
2, returned.size());
assertTrue("BoundedIOCompaction should have resulted in fewer compactions", returned.size() < operations.size());
assertEquals("BoundedIOCompaction should have resulted in 2 compactions being chosen", 2, returned.size());
// Total size of all the log files
Long returnedSize = returned.stream()
.map(s -> s.getMetrics().get(BoundedIOCompactionStrategy.TOTAL_IO_MB)).map(s -> (Long) s)
.reduce((size1, size2) -> size1 + size2).orElse(0L);
assertEquals("Should chose the first 2 compactions which should result in a total IO of 690 MB",
610, (long) returnedSize);
Long returnedSize = returned.stream().map(s -> s.getMetrics().get(BoundedIOCompactionStrategy.TOTAL_IO_MB))
.map(s -> (Long) s).reduce((size1, size2) -> size1 + size2).orElse(0L);
assertEquals("Should chose the first 2 compactions which should result in a total IO of 690 MB", 610,
(long) returnedSize);
}
@Test
@@ -91,23 +85,20 @@ public class TestHoodieCompactionStrategy {
sizesMap.put(100 * MB, Lists.newArrayList(MB));
sizesMap.put(90 * MB, Lists.newArrayList(1024 * MB));
LogFileSizeBasedCompactionStrategy strategy = new LogFileSizeBasedCompactionStrategy();
HoodieWriteConfig writeConfig = HoodieWriteConfig.newBuilder().withPath("/tmp")
.withCompactionConfig(
HoodieCompactionConfig.newBuilder().withCompactionStrategy(strategy)
.withTargetIOPerCompactionInMB(400).build()).build();
HoodieWriteConfig writeConfig = HoodieWriteConfig.newBuilder().withPath("/tmp").withCompactionConfig(
HoodieCompactionConfig.newBuilder().withCompactionStrategy(strategy).withTargetIOPerCompactionInMB(400).build())
.build();
List<CompactionOperation> operations = createCompactionOperations(writeConfig, sizesMap);
List<CompactionOperation> returned = strategy.orderAndFilter(writeConfig, operations);
assertTrue("LogFileSizeBasedCompactionStrategy should have resulted in fewer compactions",
returned.size() < operations.size());
assertEquals("LogFileSizeBasedCompactionStrategy should have resulted in 1 compaction",
1, returned.size());
assertEquals("LogFileSizeBasedCompactionStrategy should have resulted in 1 compaction", 1, returned.size());
// Total size of all the log files
Long returnedSize = returned.stream()
.map(s -> s.getMetrics().get(BoundedIOCompactionStrategy.TOTAL_IO_MB)).map(s -> (Long) s)
.reduce((size1, size2) -> size1 + size2).orElse(0L);
assertEquals("Should chose the first 2 compactions which should result in a total IO of 690 MB",
1204, (long) returnedSize);
Long returnedSize = returned.stream().map(s -> s.getMetrics().get(BoundedIOCompactionStrategy.TOTAL_IO_MB))
.map(s -> (Long) s).reduce((size1, size2) -> size1 + size2).orElse(0L);
assertEquals("Should chose the first 2 compactions which should result in a total IO of 690 MB", 1204,
(long) returnedSize);
}
@Test
@@ -118,10 +109,9 @@ public class TestHoodieCompactionStrategy {
sizesMap.put(100 * MB, Lists.newArrayList(MB));
sizesMap.put(90 * MB, Lists.newArrayList(1024 * MB));
DayBasedCompactionStrategy strategy = new DayBasedCompactionStrategy();
HoodieWriteConfig writeConfig = HoodieWriteConfig.newBuilder().withPath("/tmp")
.withCompactionConfig(
HoodieCompactionConfig.newBuilder().withCompactionStrategy(strategy)
.withTargetIOPerCompactionInMB(400).build()).build();
HoodieWriteConfig writeConfig = HoodieWriteConfig.newBuilder().withPath("/tmp").withCompactionConfig(
HoodieCompactionConfig.newBuilder().withCompactionStrategy(strategy).withTargetIOPerCompactionInMB(400).build())
.build();
List<CompactionOperation> operations = createCompactionOperations(writeConfig, sizesMap);
List<CompactionOperation> returned = strategy.orderAndFilter(writeConfig, operations);
@@ -130,8 +120,7 @@ public class TestHoodieCompactionStrategy {
int comparision = strategy.getComparator().compare(returned.get(returned.size() - 1), returned.get(0));
// Either the partition paths are sorted in descending order or they are equal
assertTrue("DayBasedCompactionStrategy should sort partitions in descending order",
comparision >= 0);
assertTrue("DayBasedCompactionStrategy should sort partitions in descending order", comparision >= 0);
}
private List<CompactionOperation> createCompactionOperations(HoodieWriteConfig config,
@@ -140,8 +129,7 @@ public class TestHoodieCompactionStrategy {
sizesMap.forEach((k, v) -> {
operations.add(new CompactionOperation(TestHoodieDataFile.newDataFile(k),
partitionPaths[new Random().nextInt(partitionPaths.length - 1)],
v.stream().map(TestHoodieLogFile::newLogFile).collect(
Collectors.toList()), config));
v.stream().map(TestHoodieLogFile::newLogFile).collect(Collectors.toList()), config));
});
return operations;
}

View File

@@ -28,6 +28,10 @@ public class TestHoodieDataFile extends HoodieDataFile {
this.size = size;
}
public static HoodieDataFile newDataFile(long size) {
return new TestHoodieDataFile(size);
}
@Override
public String getPath() {
return "/tmp/test";
@@ -43,13 +47,8 @@ public class TestHoodieDataFile extends HoodieDataFile {
return "100";
}
@Override
public long getFileSize() {
return size;
}
public static HoodieDataFile newDataFile(long size) {
return new TestHoodieDataFile(size);
}
}

View File

@@ -29,6 +29,10 @@ public class TestHoodieLogFile extends HoodieLogFile {
this.size = size;
}
public static HoodieLogFile newLogFile(long size) {
return new TestHoodieLogFile(size);
}
@Override
public Path getPath() {
return new Path("/tmp/test-log");
@@ -38,8 +42,4 @@ public class TestHoodieLogFile extends HoodieLogFile {
public Optional<Long> getFileSize() {
return Optional.of(size);
}
public static HoodieLogFile newLogFile(long size) {
return new TestHoodieLogFile(size);
}
}

View File

@@ -40,7 +40,6 @@ public class TestHoodieMetrics {
@Test
public void testRegisterGauge() {
metrics.registerGauge("metric1", 123L);
assertTrue(Metrics.getInstance().getRegistry().getGauges().get("metric1").getValue().toString()
.equals("123"));
assertTrue(Metrics.getInstance().getRegistry().getGauges().get("metric1").getValue().toString().equals("123"));
}
}

View File

@@ -89,14 +89,13 @@ public class TestCopyOnWriteTable {
String commitTime = HoodieTestUtils.makeNewCommitTime();
HoodieWriteConfig config = makeHoodieClientConfig();
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(),
basePath);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
HoodieTable table = HoodieTable.getHoodieTable(metaClient, config);
HoodieCreateHandle io = new HoodieCreateHandle(config, commitTime, table, partitionPath);
Path newPath = io.makeNewPath(record.getPartitionPath(), unitNumber, fileName);
assertTrue(newPath.toString().equals(this.basePath + "/" + partitionPath + "/" + FSUtils
.makeDataFileName(commitTime, unitNumber, fileName)));
assertTrue(newPath.toString().equals(
this.basePath + "/" + partitionPath + "/" + FSUtils.makeDataFileName(commitTime, unitNumber, fileName)));
}
private HoodieWriteConfig makeHoodieClientConfig() throws Exception {
@@ -105,8 +104,7 @@ public class TestCopyOnWriteTable {
private HoodieWriteConfig.Builder makeHoodieClientConfigBuilder() throws Exception {
// Prepare the AvroParquetIO
String schemaStr = IOUtils
.toString(getClass().getResourceAsStream("/exampleSchema.txt"), "UTF-8");
String schemaStr = IOUtils.toString(getClass().getResourceAsStream("/exampleSchema.txt"), "UTF-8");
return HoodieWriteConfig.newBuilder().withPath(basePath).withSchema(schemaStr);
}
@@ -122,28 +120,27 @@ public class TestCopyOnWriteTable {
HoodieCopyOnWriteTable table = new HoodieCopyOnWriteTable(config, metadata);
// Get some records belong to the same partition (2016/01/31)
String recordStr1 = "{\"_row_key\":\"8eb5b87a-1feh-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"8eb5b87b-1feu-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"8eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr4 = "{\"_row_key\":\"8eb5b87d-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":51}";
String recordStr1 = "{\"_row_key\":\"8eb5b87a-1feh-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"8eb5b87b-1feu-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"8eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr4 = "{\"_row_key\":\"8eb5b87d-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":51}";
List<HoodieRecord> records = new ArrayList<>();
TestRawTripPayload rowChange1 = new TestRawTripPayload(recordStr1);
records.add(
new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()),
rowChange1));
records.add(new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()), rowChange1));
TestRawTripPayload rowChange2 = new TestRawTripPayload(recordStr2);
records.add(
new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()),
rowChange2));
records.add(new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()), rowChange2));
TestRawTripPayload rowChange3 = new TestRawTripPayload(recordStr3);
records.add(
new HoodieRecord(new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()),
rowChange3));
records.add(new HoodieRecord(new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()), rowChange3));
// Insert new records
HoodieClientTestUtils.collectStatuses(table.handleInsert(firstCommitTime, records.iterator()));
// We should have a parquet file generated (TODO: better control # files after we revise AvroParquetIO)
// We should have a parquet file generated (TODO: better control # files after we revise
// AvroParquetIO)
File parquetFile = null;
for (File file : new File(this.basePath + partitionPath).listFiles()) {
if (file.getName().endsWith(".parquet")) {
@@ -155,18 +152,17 @@ public class TestCopyOnWriteTable {
// Read out the bloom filter and make sure filter can answer record exist or not
Path parquetFilePath = new Path(parquetFile.getAbsolutePath());
BloomFilter filter = ParquetUtils
.readBloomFilterFromParquetMetadata(jsc.hadoopConfiguration(), parquetFilePath);
BloomFilter filter = ParquetUtils.readBloomFilterFromParquetMetadata(jsc.hadoopConfiguration(), parquetFilePath);
for (HoodieRecord record : records) {
assertTrue(filter.mightContain(record.getRecordKey()));
}
// Create a commit file
new File(this.basePath + "/" + HoodieTableMetaClient.METAFOLDER_NAME + "/"
+ FSUtils.getCommitTime(parquetFile.getName()) + ".commit").createNewFile();
new File(
this.basePath + "/" + HoodieTableMetaClient.METAFOLDER_NAME + "/" + FSUtils.getCommitTime(parquetFile.getName())
+ ".commit").createNewFile();
// Read the parquet file, check the record content
List<GenericRecord> fileRecords = ParquetUtils
.readAvroRecords(jsc.hadoopConfiguration(), parquetFilePath);
List<GenericRecord> fileRecords = ParquetUtils.readAvroRecords(jsc.hadoopConfiguration(), parquetFilePath);
GenericRecord newRecord;
int index = 0;
for (GenericRecord record : fileRecords) {
@@ -175,13 +171,12 @@ public class TestCopyOnWriteTable {
}
// We update the 1st record & add a new record
String updateRecordStr1 = "{\"_row_key\":\"8eb5b87a-1feh-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String updateRecordStr1 = "{\"_row_key\":\"8eb5b87a-1feh-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
TestRawTripPayload updateRowChanges1 = new TestRawTripPayload(updateRecordStr1);
HoodieRecord updatedRecord1 = new HoodieRecord(
new HoodieKey(updateRowChanges1.getRowKey(), updateRowChanges1.getPartitionPath()),
updateRowChanges1);
updatedRecord1.setCurrentLocation(
new HoodieRecordLocation(null, FSUtils.getFileId(parquetFile.getName())));
new HoodieKey(updateRowChanges1.getRowKey(), updateRowChanges1.getPartitionPath()), updateRowChanges1);
updatedRecord1.setCurrentLocation(new HoodieRecordLocation(null, FSUtils.getFileId(parquetFile.getName())));
TestRawTripPayload rowChange4 = new TestRawTripPayload(recordStr4);
HoodieRecord insertedRecord1 = new HoodieRecord(
@@ -201,9 +196,8 @@ public class TestCopyOnWriteTable {
File updatedParquetFile = null;
for (File file : new File(basePath + "/2016/01/31").listFiles()) {
if (file.getName().endsWith(".parquet")) {
if (FSUtils.getFileId(file.getName())
.equals(FSUtils.getFileId(parquetFile.getName())) &&
HoodieTimeline.compareTimestamps(FSUtils.getCommitTime(file.getName()),
if (FSUtils.getFileId(file.getName()).equals(FSUtils.getFileId(parquetFile.getName()))
&& HoodieTimeline.compareTimestamps(FSUtils.getCommitTime(file.getName()),
FSUtils.getCommitTime(parquetFile.getName()), HoodieTimeline.GREATER)) {
updatedParquetFile = file;
break;
@@ -213,8 +207,8 @@ public class TestCopyOnWriteTable {
assertTrue(updatedParquetFile != null);
// Check whether the record has been updated
Path updatedParquetFilePath = new Path(updatedParquetFile.getAbsolutePath());
BloomFilter updatedFilter = ParquetUtils
.readBloomFilterFromParquetMetadata(jsc.hadoopConfiguration(), updatedParquetFilePath);
BloomFilter updatedFilter = ParquetUtils.readBloomFilterFromParquetMetadata(jsc.hadoopConfiguration(),
updatedParquetFilePath);
for (HoodieRecord record : records) {
// No change to the _row_key
assertTrue(updatedFilter.mightContain(record.getRecordKey()));
@@ -223,8 +217,7 @@ public class TestCopyOnWriteTable {
assertTrue(updatedFilter.mightContain(insertedRecord1.getRecordKey()));
records.add(insertedRecord1);// add this so it can be checked further below
ParquetReader updatedReader = ParquetReader
.builder(new AvroReadSupport<>(), updatedParquetFilePath).build();
ParquetReader updatedReader = ParquetReader.builder(new AvroReadSupport<>(), updatedParquetFilePath).build();
index = 0;
while ((newRecord = (GenericRecord) updatedReader.read()) != null) {
assertTrue(newRecord.get("_row_key").toString().equals(records.get(index).getRecordKey()));
@@ -246,13 +239,9 @@ public class TestCopyOnWriteTable {
List<HoodieRecord> records = new ArrayList<>();
for (int i = 0; i < n; i++) {
String recordStr = String.format("{\"_row_key\":\"%s\",\"time\":\"%s\",\"number\":%d}",
UUID.randomUUID().toString(),
time,
i);
UUID.randomUUID().toString(), time, i);
TestRawTripPayload rowChange = new TestRawTripPayload(recordStr);
records.add(new HoodieRecord(
new HoodieKey(rowChange.getRowKey(), rowChange.getPartitionPath()),
rowChange));
records.add(new HoodieRecord(new HoodieKey(rowChange.getRowKey(), rowChange.getPartitionPath()), rowChange));
}
return records;
}
@@ -261,31 +250,28 @@ public class TestCopyOnWriteTable {
@Test
public void testMetadataAggregateFromWriteStatus() throws Exception {
// Prepare the AvroParquetIO
HoodieWriteConfig config = makeHoodieClientConfigBuilder()
.withWriteStatusClass(MetadataMergeWriteStatus.class).build();
HoodieWriteConfig config = makeHoodieClientConfigBuilder().withWriteStatusClass(MetadataMergeWriteStatus.class)
.build();
String firstCommitTime = HoodieTestUtils.makeNewCommitTime();
HoodieTableMetaClient metadata = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
HoodieCopyOnWriteTable table = new HoodieCopyOnWriteTable(config, metadata);
// Get some records belong to the same partition (2016/01/31)
String recordStr1 = "{\"_row_key\":\"8eb5b87a-1feh-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"8eb5b87b-1feu-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"8eb5b87c-1fej-4edd-87b4-6ec96dc405a0\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
String recordStr1 = "{\"_row_key\":\"8eb5b87a-1feh-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":12}";
String recordStr2 = "{\"_row_key\":\"8eb5b87b-1feu-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:20:41.415Z\",\"number\":100}";
String recordStr3 = "{\"_row_key\":\"8eb5b87c-1fej-4edd-87b4-6ec96dc405a0\","
+ "\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":15}";
List<HoodieRecord> records = new ArrayList<>();
TestRawTripPayload rowChange1 = new TestRawTripPayload(recordStr1);
records.add(
new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()),
rowChange1));
records.add(new HoodieRecord(new HoodieKey(rowChange1.getRowKey(), rowChange1.getPartitionPath()), rowChange1));
TestRawTripPayload rowChange2 = new TestRawTripPayload(recordStr2);
records.add(
new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()),
rowChange2));
records.add(new HoodieRecord(new HoodieKey(rowChange2.getRowKey(), rowChange2.getPartitionPath()), rowChange2));
TestRawTripPayload rowChange3 = new TestRawTripPayload(recordStr3);
records.add(
new HoodieRecord(new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()),
rowChange3));
records.add(new HoodieRecord(new HoodieKey(rowChange3.getRowKey(), rowChange3.getPartitionPath()), rowChange3));
// Insert new records
List<WriteStatus> writeStatuses = HoodieClientTestUtils
@@ -293,7 +279,8 @@ public class TestCopyOnWriteTable {
Map<String, String> allWriteStatusMergedMetadataMap = MetadataMergeWriteStatus
.mergeMetadataForWriteStatuses(writeStatuses);
assertTrue(allWriteStatusMergedMetadataMap.containsKey("InputRecordCount_1506582000"));
// For metadata key InputRecordCount_1506582000, value is 2 for each record. So sum of this should be 2 * 3
// For metadata key InputRecordCount_1506582000, value is 2 for each record. So sum of this
// should be 2 * 3
assertEquals("6", allWriteStatusMergedMetadataMap.get("InputRecordCount_1506582000"));
}
@@ -314,26 +301,19 @@ public class TestCopyOnWriteTable {
List<WriteStatus> statuses = HoodieClientTestUtils
.collectStatuses(table.handleInsert(commitTime, records.iterator()));
WriteStatus status = statuses.get(0);
Path partialFile = new Path(String.format("%s/%s/%s",
basePath,
status.getPartitionPath(),
FSUtils.makeDataFileName(commitTime, 0, status.getFileId()))
);
Path partialFile = new Path(String.format("%s/%s/%s", basePath, status.getPartitionPath(),
FSUtils.makeDataFileName(commitTime, 0, status.getFileId())));
assertTrue(fs.exists(partialFile));
// When we retry
records = newHoodieRecords(10, "2016-01-31T03:16:41.415Z");
records.addAll(newHoodieRecords(1, "2016-02-01T03:16:41.415Z"));
statuses = HoodieClientTestUtils
.collectStatuses(table.handleInsert(commitTime, records.iterator()));
statuses = HoodieClientTestUtils.collectStatuses(table.handleInsert(commitTime, records.iterator()));
status = statuses.get(0);
Path retriedFIle = new Path(String.format("%s/%s/%s",
basePath,
status.getPartitionPath(),
FSUtils.makeDataFileName(commitTime, 0, status.getFileId()))
);
Path retriedFIle = new Path(String.format("%s/%s/%s", basePath, status.getPartitionPath(),
FSUtils.makeDataFileName(commitTime, 0, status.getFileId())));
assertTrue(fs.exists(retriedFIle));
assertFalse(fs.exists(partialFile));
}
@@ -371,8 +351,7 @@ public class TestCopyOnWriteTable {
records.addAll(newHoodieRecords(1, "2016-02-02T03:16:41.415Z"));
// Insert new records
returnedStatuses = HoodieClientTestUtils
.collectStatuses(table.handleInsert(commitTime, records.iterator()));
returnedStatuses = HoodieClientTestUtils.collectStatuses(table.handleInsert(commitTime, records.iterator()));
assertEquals(3, returnedStatuses.size());
assertEquals("2016/01/31", returnedStatuses.get(0).getPartitionPath());
@@ -389,8 +368,8 @@ public class TestCopyOnWriteTable {
@Test
public void testFileSizeUpsertRecords() throws Exception {
HoodieWriteConfig config = makeHoodieClientConfigBuilder().withStorageConfig(
HoodieStorageConfig.newBuilder().limitFileSize(64 * 1024).parquetBlockSize(64 * 1024)
.parquetPageSize(64 * 1024).build()).build();
HoodieStorageConfig.newBuilder().limitFileSize(64 * 1024).parquetBlockSize(64 * 1024).parquetPageSize(64 * 1024)
.build()).build();
String commitTime = HoodieTestUtils.makeNewCommitTime();
HoodieTableMetaClient metadata = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
HoodieCopyOnWriteTable table = new HoodieCopyOnWriteTable(config, metadata);
@@ -398,12 +377,11 @@ public class TestCopyOnWriteTable {
List<HoodieRecord> records = new ArrayList<>();
// Approx 1150 records are written for block size of 64KB
for (int i = 0; i < 2000; i++) {
String recordStr = "{\"_row_key\":\"" + UUID.randomUUID().toString()
+ "\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":" + i + "}";
String recordStr =
"{\"_row_key\":\"" + UUID.randomUUID().toString() + "\",\"time\":\"2016-01-31T03:16:41.415Z\",\"number\":" + i
+ "}";
TestRawTripPayload rowChange = new TestRawTripPayload(recordStr);
records
.add(new HoodieRecord(new HoodieKey(rowChange.getRowKey(), rowChange.getPartitionPath()),
rowChange));
records.add(new HoodieRecord(new HoodieKey(rowChange.getRowKey(), rowChange.getPartitionPath()), rowChange));
}
// Insert new records
@@ -412,39 +390,30 @@ public class TestCopyOnWriteTable {
// Check the updated file
int counts = 0;
for (File file : new File(basePath + "/2016/01/31").listFiles()) {
if (file.getName().endsWith(".parquet") && FSUtils.getCommitTime(file.getName())
.equals(commitTime)) {
if (file.getName().endsWith(".parquet") && FSUtils.getCommitTime(file.getName()).equals(commitTime)) {
System.out.println(file.getName() + "-" + file.length());
counts++;
}
}
assertEquals(
"If the number of records are more than 1150, then there should be a new file", 3,
counts);
assertEquals("If the number of records are more than 1150, then there should be a new file", 3, counts);
}
private List<HoodieCopyOnWriteTable.InsertBucket> testUpsertPartitioner(int smallFileSize,
int numInserts,
int numUpdates,
int fileSize,
boolean autoSplitInserts) throws Exception {
final String TEST_PARTITION_PATH = "2016/09/26";
HoodieWriteConfig config = makeHoodieClientConfigBuilder()
.withCompactionConfig(HoodieCompactionConfig.newBuilder()
.compactionSmallFileSize(smallFileSize).insertSplitSize(100)
.autoTuneInsertSplits(autoSplitInserts).build())
.withStorageConfig(HoodieStorageConfig.newBuilder().limitFileSize(1000 * 1024).build())
.build();
private List<HoodieCopyOnWriteTable.InsertBucket> testUpsertPartitioner(int smallFileSize, int numInserts,
int numUpdates, int fileSize, boolean autoSplitInserts) throws Exception {
final String testPartitionPath = "2016/09/26";
HoodieWriteConfig config = makeHoodieClientConfigBuilder().withCompactionConfig(
HoodieCompactionConfig.newBuilder().compactionSmallFileSize(smallFileSize).insertSplitSize(100)
.autoTuneInsertSplits(autoSplitInserts).build()).withStorageConfig(
HoodieStorageConfig.newBuilder().limitFileSize(1000 * 1024).build()).build();
HoodieClientTestUtils.fakeCommitFile(basePath, "001");
HoodieClientTestUtils.fakeDataFile(basePath, TEST_PARTITION_PATH, "001", "file1", fileSize);
HoodieClientTestUtils.fakeDataFile(basePath, testPartitionPath, "001", "file1", fileSize);
HoodieTableMetaClient metadata = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
HoodieCopyOnWriteTable table = new HoodieCopyOnWriteTable(config, metadata);
HoodieTestDataGenerator dataGenerator = new HoodieTestDataGenerator(
new String[]{TEST_PARTITION_PATH});
HoodieTestDataGenerator dataGenerator = new HoodieTestDataGenerator(new String[] {testPartitionPath});
List<HoodieRecord> insertRecords = dataGenerator.generateInserts("001", numInserts);
List<HoodieRecord> updateRecords = dataGenerator.generateUpdates("001", numUpdates);
for (HoodieRecord updateRec : updateRecords) {
@@ -454,8 +423,8 @@ public class TestCopyOnWriteTable {
records.addAll(insertRecords);
records.addAll(updateRecords);
WorkloadProfile profile = new WorkloadProfile(jsc.parallelize(records));
HoodieCopyOnWriteTable.UpsertPartitioner partitioner = (HoodieCopyOnWriteTable.UpsertPartitioner)
table.getUpsertPartitioner(profile);
HoodieCopyOnWriteTable.UpsertPartitioner partitioner =
(HoodieCopyOnWriteTable.UpsertPartitioner) table.getUpsertPartitioner(profile);
assertEquals("Should have 3 partitions", 3, partitioner.numPartitions());
assertEquals("Bucket 0 is UPDATE", HoodieCopyOnWriteTable.BucketType.UPDATE,
@@ -464,40 +433,35 @@ public class TestCopyOnWriteTable {
partitioner.getBucketInfo(1).bucketType);
assertEquals("Bucket 2 is INSERT", HoodieCopyOnWriteTable.BucketType.INSERT,
partitioner.getBucketInfo(2).bucketType);
assertEquals("Update record should have gone to the 1 update partiton", 0,
partitioner.getPartition(new Tuple2<>(updateRecords.get(0).getKey(),
Option.apply(updateRecords.get(0).getCurrentLocation()))));
return partitioner.getInsertBuckets(TEST_PARTITION_PATH);
assertEquals("Update record should have gone to the 1 update partiton", 0, partitioner.getPartition(
new Tuple2<>(updateRecords.get(0).getKey(), Option.apply(updateRecords.get(0).getCurrentLocation()))));
return partitioner.getInsertBuckets(testPartitionPath);
}
@Test
public void testUpsertPartitioner() throws Exception {
// Inserts + Updates... Check all updates go together & inserts subsplit
List<HoodieCopyOnWriteTable.InsertBucket> insertBuckets = testUpsertPartitioner(0, 200, 100,
1024, false);
List<HoodieCopyOnWriteTable.InsertBucket> insertBuckets = testUpsertPartitioner(0, 200, 100, 1024, false);
assertEquals("Total of 2 insert buckets", 2, insertBuckets.size());
}
@Test
public void testUpsertPartitionerWithSmallInsertHandling() throws Exception {
// Inserts + Updates .. Check updates go together & inserts subsplit, after expanding smallest file
List<HoodieCopyOnWriteTable.InsertBucket> insertBuckets = testUpsertPartitioner(1000 * 1024,
400, 100, 800 * 1024, false);
// Inserts + Updates .. Check updates go together & inserts subsplit, after expanding
// smallest file
List<HoodieCopyOnWriteTable.InsertBucket> insertBuckets = testUpsertPartitioner(1000 * 1024, 400, 100, 800 * 1024,
false);
assertEquals("Total of 3 insert buckets", 3, insertBuckets.size());
assertEquals("First insert bucket must be same as update bucket", 0,
insertBuckets.get(0).bucketNumber);
assertEquals("First insert bucket should have weight 0.5", 0.5, insertBuckets.get(0).weight,
0.01);
assertEquals("First insert bucket must be same as update bucket", 0, insertBuckets.get(0).bucketNumber);
assertEquals("First insert bucket should have weight 0.5", 0.5, insertBuckets.get(0).weight, 0.01);
// Now with insert split size auto tuned
insertBuckets = testUpsertPartitioner(1000 * 1024, 2400, 100, 800 * 1024, true);
assertEquals("Total of 3 insert buckets", 3, insertBuckets.size());
assertEquals("First insert bucket must be same as update bucket", 0,
insertBuckets.get(0).bucketNumber);
assertEquals("First insert bucket should have weight 0.5", 200.0 / 2400,
insertBuckets.get(0).weight, 0.01);
assertEquals("First insert bucket must be same as update bucket", 0, insertBuckets.get(0).bucketNumber);
assertEquals("First insert bucket should have weight 0.5", 200.0 / 2400, insertBuckets.get(0).weight, 0.01);
}
@After

View File

@@ -18,7 +18,6 @@
package com.uber.hoodie.table;
import static com.uber.hoodie.common.HoodieTestDataGenerator.TRIP_EXAMPLE_SCHEMA;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
@@ -76,15 +75,14 @@ import org.junit.rules.TemporaryFolder;
public class TestMergeOnReadTable {
private transient JavaSparkContext jsc = null;
private transient SQLContext sqlContext;
private static String basePath = null;
//NOTE : Be careful in using DFS (FileSystem.class) vs LocalFs(RawLocalFileSystem.class)
//The implementation and guarantees of many APIs differ, for example check rename(src,dst)
private static MiniDFSCluster dfsCluster;
private static DistributedFileSystem dfs;
private static HdfsTestService hdfsTestService;
private transient JavaSparkContext jsc = null;
private transient SQLContext sqlContext;
@AfterClass
public static void cleanUp() throws Exception {
@@ -92,13 +90,15 @@ public class TestMergeOnReadTable {
hdfsTestService.stop();
dfsCluster.shutdown();
}
// Need to closeAll to clear FileSystem.Cache, required because DFS and LocalFS used in the same JVM
// Need to closeAll to clear FileSystem.Cache, required because DFS and LocalFS used in the
// same JVM
FileSystem.closeAll();
}
@BeforeClass
public static void setUpDFS() throws IOException {
// Need to closeAll to clear FileSystem.Cache, required because DFS and LocalFS used in the same JVM
// Need to closeAll to clear FileSystem.Cache, required because DFS and LocalFS used in the
// same JVM
FileSystem.closeAll();
if (hdfsTestService == null) {
hdfsTestService = new HdfsTestService();
@@ -111,8 +111,7 @@ public class TestMergeOnReadTable {
@Before
public void init() throws IOException {
// Initialize a local spark env
jsc = new JavaSparkContext(
HoodieClientTestUtils.getSparkConfForTest("TestHoodieMergeOnReadTable"));
jsc = new JavaSparkContext(HoodieClientTestUtils.getSparkConfForTest("TestHoodieMergeOnReadTable"));
// Create a temp folder as the base path
TemporaryFolder folder = new TemporaryFolder();
@@ -154,28 +153,23 @@ public class TestMergeOnReadTable {
List<WriteStatus> statuses = client.upsert(writeRecords, newCommitTime).collect();
assertNoWriteErrors(statuses);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(),
cfg.getBasePath());
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath());
HoodieTable hoodieTable = HoodieTable.getHoodieTable(metaClient, cfg);
Optional<HoodieInstant> deltaCommit =
metaClient.getActiveTimeline().getDeltaCommitTimeline().firstInstant();
Optional<HoodieInstant> deltaCommit = metaClient.getActiveTimeline().getDeltaCommitTimeline().firstInstant();
assertTrue(deltaCommit.isPresent());
assertEquals("Delta commit should be 001", "001", deltaCommit.get().getTimestamp());
Optional<HoodieInstant> commit =
metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
Optional<HoodieInstant> commit = metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
assertFalse(commit.isPresent());
FileStatus[] allFiles = HoodieTestUtils
.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
FileStatus[] allFiles = HoodieTestUtils.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
TableFileSystemView.ReadOptimizedView roView = new HoodieTableFileSystemView(metaClient,
hoodieTable.getCommitTimeline().filterCompletedInstants(), allFiles);
Stream<HoodieDataFile> dataFilesToRead = roView.getLatestDataFiles();
assertTrue(!dataFilesToRead.findAny().isPresent());
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(),
allFiles);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(), allFiles);
dataFilesToRead = roView.getLatestDataFiles();
assertTrue("RealtimeTableView should list the parquet files we wrote in the delta commit",
dataFilesToRead.findAny().isPresent());
@@ -209,21 +203,17 @@ public class TestMergeOnReadTable {
client.compact(compactionCommitTime);
allFiles = HoodieTestUtils.listAllDataFilesInPath(dfs, cfg.getBasePath());
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(),
allFiles);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(), allFiles);
dataFilesToRead = roView.getLatestDataFiles();
assertTrue(dataFilesToRead.findAny().isPresent());
// verify that there is a commit
HoodieTable table = HoodieTable.getHoodieTable(
new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath(), true),
getConfig(false));
new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath(), true), getConfig(false));
HoodieTimeline timeline = table.getCommitTimeline().filterCompletedInstants();
assertEquals("Expecting a single commit.", 1,
timeline.findInstantsAfter("000", Integer.MAX_VALUE).countInstants());
assertEquals("Expecting a single commit.", 1, timeline.findInstantsAfter("000", Integer.MAX_VALUE).countInstants());
String latestCompactionCommitTime = timeline.lastInstant().get().getTimestamp();
assertTrue(HoodieTimeline
.compareTimestamps("000", latestCompactionCommitTime, HoodieTimeline.LESSER));
assertTrue(HoodieTimeline.compareTimestamps("000", latestCompactionCommitTime, HoodieTimeline.LESSER));
assertEquals("Must contain 200 records", 200,
HoodieClientTestUtils.readSince(basePath, sqlContext, timeline, "000").count());
@@ -232,8 +222,7 @@ public class TestMergeOnReadTable {
// Check if record level metadata is aggregated properly at the end of write.
@Test
public void testMetadataAggregateFromWriteStatus() throws Exception {
HoodieWriteConfig cfg = getConfigBuilder(false)
.withWriteStatusClass(MetadataMergeWriteStatus.class).build();
HoodieWriteConfig cfg = getConfigBuilder(false).withWriteStatusClass(MetadataMergeWriteStatus.class).build();
HoodieWriteClient client = new HoodieWriteClient(jsc, cfg);
String newCommitTime = "001";
@@ -248,7 +237,8 @@ public class TestMergeOnReadTable {
Map<String, String> allWriteStatusMergedMetadataMap = MetadataMergeWriteStatus
.mergeMetadataForWriteStatuses(statuses);
assertTrue(allWriteStatusMergedMetadataMap.containsKey("InputRecordCount_1506582000"));
// For metadata key InputRecordCount_1506582000, value is 2 for each record. So sum of this should be 2 * records.size()
// For metadata key InputRecordCount_1506582000, value is 2 for each record. So sum of this
// should be 2 * records.size()
assertEquals(String.valueOf(2 * records.size()),
allWriteStatusMergedMetadataMap.get("InputRecordCount_1506582000"));
}
@@ -271,28 +261,23 @@ public class TestMergeOnReadTable {
List<WriteStatus> statuses = client.upsert(writeRecords, newCommitTime).collect();
assertNoWriteErrors(statuses);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(),
cfg.getBasePath());
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath());
HoodieTable hoodieTable = HoodieTable.getHoodieTable(metaClient, cfg);
Optional<HoodieInstant> deltaCommit =
metaClient.getActiveTimeline().getDeltaCommitTimeline().firstInstant();
Optional<HoodieInstant> deltaCommit = metaClient.getActiveTimeline().getDeltaCommitTimeline().firstInstant();
assertTrue(deltaCommit.isPresent());
assertEquals("Delta commit should be 001", "001", deltaCommit.get().getTimestamp());
Optional<HoodieInstant> commit =
metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
Optional<HoodieInstant> commit = metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
assertFalse(commit.isPresent());
FileStatus[] allFiles = HoodieTestUtils
.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
FileStatus[] allFiles = HoodieTestUtils.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
TableFileSystemView.ReadOptimizedView roView = new HoodieTableFileSystemView(metaClient,
hoodieTable.getCommitTimeline().filterCompletedInstants(), allFiles);
Stream<HoodieDataFile> dataFilesToRead = roView.getLatestDataFiles();
assertTrue(!dataFilesToRead.findAny().isPresent());
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(),
allFiles);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(), allFiles);
dataFilesToRead = roView.getLatestDataFiles();
assertTrue("RealtimeTableView should list the parquet files we wrote in the delta commit",
dataFilesToRead.findAny().isPresent());
@@ -329,15 +314,12 @@ public class TestMergeOnReadTable {
assertFalse(commit.isPresent());
allFiles = HoodieTestUtils.listAllDataFilesInPath(dfs, cfg.getBasePath());
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(),
allFiles);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(), allFiles);
dataFilesToRead = roView.getLatestDataFiles();
assertTrue(dataFilesToRead.findAny().isPresent());
List<String> dataFiles = roView.getLatestDataFiles().map(hf -> hf.getPath())
.collect(Collectors.toList());
List<GenericRecord> recordsRead = HoodieMergeOnReadTestUtils
.getRecordsUsingInputFormat(dataFiles, basePath);
List<String> dataFiles = roView.getLatestDataFiles().map(hf -> hf.getPath()).collect(Collectors.toList());
List<GenericRecord> recordsRead = HoodieMergeOnReadTestUtils.getRecordsUsingInputFormat(dataFiles, basePath);
//Wrote 40 records and deleted 20 records, so remaining 40-20 = 20
assertEquals("Must contain 20 records", 20, recordsRead.size());
}
@@ -365,10 +347,8 @@ public class TestMergeOnReadTable {
//verify there are no errors
assertNoWriteErrors(statuses);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(),
cfg.getBasePath());
Optional<HoodieInstant> commit =
metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath());
Optional<HoodieInstant> commit = metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
assertTrue(commit.isPresent());
assertEquals("commit should be 001", "001", commit.get().getTimestamp());
@@ -391,10 +371,8 @@ public class TestMergeOnReadTable {
client.rollback(newCommitTime);
metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath());
HoodieTable hoodieTable = HoodieTable
.getHoodieTable(metaClient, cfg);
FileStatus[] allFiles = HoodieTestUtils
.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
HoodieTable hoodieTable = HoodieTable.getHoodieTable(metaClient, cfg);
FileStatus[] allFiles = HoodieTestUtils.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
HoodieTableFileSystemView roView = new HoodieTableFileSystemView(metaClient,
hoodieTable.getCompletedCommitTimeline(), allFiles);
@@ -428,28 +406,23 @@ public class TestMergeOnReadTable {
List<WriteStatus> statuses = client.upsert(writeRecords, newCommitTime).collect();
assertNoWriteErrors(statuses);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(),
cfg.getBasePath());
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath());
HoodieTable hoodieTable = HoodieTable.getHoodieTable(metaClient, cfg);
Optional<HoodieInstant> deltaCommit =
metaClient.getActiveTimeline().getDeltaCommitTimeline().firstInstant();
Optional<HoodieInstant> deltaCommit = metaClient.getActiveTimeline().getDeltaCommitTimeline().firstInstant();
assertTrue(deltaCommit.isPresent());
assertEquals("Delta commit should be 001", "001", deltaCommit.get().getTimestamp());
Optional<HoodieInstant> commit =
metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
Optional<HoodieInstant> commit = metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
assertFalse(commit.isPresent());
FileStatus[] allFiles = HoodieTestUtils
.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
FileStatus[] allFiles = HoodieTestUtils.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
TableFileSystemView.ReadOptimizedView roView = new HoodieTableFileSystemView(metaClient,
hoodieTable.getCommitTimeline().filterCompletedInstants(), allFiles);
Stream<HoodieDataFile> dataFilesToRead = roView.getLatestDataFiles();
assertTrue(!dataFilesToRead.findAny().isPresent());
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(),
allFiles);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(), allFiles);
dataFilesToRead = roView.getLatestDataFiles();
assertTrue("RealtimeTableView should list the parquet files we wrote in the delta commit",
dataFilesToRead.findAny().isPresent());
@@ -473,10 +446,8 @@ public class TestMergeOnReadTable {
commit = metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
assertFalse(commit.isPresent());
List<String> dataFiles = roView.getLatestDataFiles().map(hf -> hf.getPath())
.collect(Collectors.toList());
List<GenericRecord> recordsRead = HoodieMergeOnReadTestUtils
.getRecordsUsingInputFormat(dataFiles, basePath);
List<String> dataFiles = roView.getLatestDataFiles().map(hf -> hf.getPath()).collect(Collectors.toList());
List<GenericRecord> recordsRead = HoodieMergeOnReadTestUtils.getRecordsUsingInputFormat(dataFiles, basePath);
assertEquals(recordsRead.size(), 200);
@@ -485,8 +456,7 @@ public class TestMergeOnReadTable {
metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath());
hoodieTable = HoodieTable.getHoodieTable(metaClient, cfg);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(),
allFiles);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(), allFiles);
dataFiles = roView.getLatestDataFiles().map(hf -> hf.getPath()).collect(Collectors.toList());
recordsRead = HoodieMergeOnReadTestUtils.getRecordsUsingInputFormat(dataFiles, basePath);
@@ -512,11 +482,10 @@ public class TestMergeOnReadTable {
allFiles = HoodieTestUtils.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath());
hoodieTable = HoodieTable.getHoodieTable(metaClient, cfg);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCommitsTimeline(),
allFiles);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCommitsTimeline(), allFiles);
final String compactedCommitTime = metaClient.getActiveTimeline().reload()
.getCommitsTimeline().lastInstant().get().getTimestamp();
final String compactedCommitTime = metaClient.getActiveTimeline().reload().getCommitsTimeline().lastInstant().get()
.getTimestamp();
assertTrue(roView.getLatestDataFiles().filter(file -> {
if (compactedCommitTime.equals(file.getCommitTime())) {
@@ -531,8 +500,7 @@ public class TestMergeOnReadTable {
allFiles = HoodieTestUtils.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath());
hoodieTable = HoodieTable.getHoodieTable(metaClient, cfg);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCommitsTimeline(),
allFiles);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCommitsTimeline(), allFiles);
assertFalse(roView.getLatestDataFiles().filter(file -> {
if (compactedCommitTime.equals(file.getCommitTime())) {
@@ -564,30 +532,28 @@ public class TestMergeOnReadTable {
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), cfg.getBasePath());
HoodieTable hoodieTable = HoodieTable.getHoodieTable(metaClient, cfg);
Optional<HoodieInstant> deltaCommit =
metaClient.getActiveTimeline().getDeltaCommitTimeline().firstInstant();
Optional<HoodieInstant> deltaCommit = metaClient.getActiveTimeline().getDeltaCommitTimeline().firstInstant();
assertTrue(deltaCommit.isPresent());
assertEquals("Delta commit should be 001", "001", deltaCommit.get().getTimestamp());
Optional<HoodieInstant> commit =
metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
Optional<HoodieInstant> commit = metaClient.getActiveTimeline().getCommitTimeline().firstInstant();
assertFalse(commit.isPresent());
FileStatus[] allFiles = HoodieTestUtils
.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
FileStatus[] allFiles = HoodieTestUtils.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
TableFileSystemView.ReadOptimizedView roView = new HoodieTableFileSystemView(metaClient,
hoodieTable.getCommitsTimeline().filterCompletedInstants(), allFiles);
Stream<HoodieDataFile> dataFilesToRead = roView.getLatestDataFiles();
Map<String, Long> parquetFileIdToSize = dataFilesToRead.collect(Collectors.toMap(HoodieDataFile::getFileId, HoodieDataFile::getFileSize));
Map<String, Long> parquetFileIdToSize = dataFilesToRead.collect(
Collectors.toMap(HoodieDataFile::getFileId, HoodieDataFile::getFileSize));
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(),
allFiles);
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getCompletedCommitTimeline(), allFiles);
dataFilesToRead = roView.getLatestDataFiles();
assertTrue("RealtimeTableView should list the parquet files we wrote in the delta commit",
dataFilesToRead.findAny().isPresent());
/**
* Write 2 (only updates + inserts, written to .log file + correction of existing parquet file size)
* Write 2 (only updates + inserts, written to .log file + correction of existing parquet
* file size)
*/
newCommitTime = "002";
client.startCommitWithTime(newCommitTime);
@@ -608,18 +574,17 @@ public class TestMergeOnReadTable {
assertFalse(commit.isPresent());
allFiles = HoodieTestUtils.listAllDataFilesInPath(metaClient.getFs(), cfg.getBasePath());
roView = new HoodieTableFileSystemView(metaClient, hoodieTable.getActiveTimeline().reload()
.getCommitsTimeline().filterCompletedInstants(), allFiles);
roView = new HoodieTableFileSystemView(metaClient,
hoodieTable.getActiveTimeline().reload().getCommitsTimeline().filterCompletedInstants(), allFiles);
dataFilesToRead = roView.getLatestDataFiles();
Map<String, Long> parquetFileIdToNewSize = dataFilesToRead.collect(Collectors.toMap(HoodieDataFile::getFileId, HoodieDataFile::getFileSize));
Map<String, Long> parquetFileIdToNewSize = dataFilesToRead.collect(
Collectors.toMap(HoodieDataFile::getFileId, HoodieDataFile::getFileSize));
assertTrue(parquetFileIdToNewSize.entrySet().stream()
.filter(entry -> parquetFileIdToSize.get(entry.getKey()) < entry.getValue()).count() > 0);
List<String> dataFiles = roView.getLatestDataFiles().map(hf -> hf.getPath())
.collect(Collectors.toList());
List<GenericRecord> recordsRead = HoodieMergeOnReadTestUtils
.getRecordsUsingInputFormat(dataFiles, basePath);
List<String> dataFiles = roView.getLatestDataFiles().map(hf -> hf.getPath()).collect(Collectors.toList());
List<GenericRecord> recordsRead = HoodieMergeOnReadTestUtils.getRecordsUsingInputFormat(dataFiles, basePath);
//Wrote 20 records in 2 batches
assertEquals("Must contain 40 records", 40, recordsRead.size());
}
@@ -639,8 +604,7 @@ public class TestMergeOnReadTable {
List<WriteStatus> statuses = writeClient.insert(recordsRDD, newCommitTime).collect();
// Update all the 100 records
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(),
basePath);
HoodieTableMetaClient metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
HoodieTable table = HoodieTable.getHoodieTable(metaClient, config);
newCommitTime = "101";
@@ -653,19 +617,17 @@ public class TestMergeOnReadTable {
// Write them to corresponding avro logfiles
HoodieTestUtils
.writeRecordsToLogFiles(metaClient.getFs(), metaClient.getBasePath(),
HoodieTestDataGenerator.avroSchema, updatedRecords);
.writeRecordsToLogFiles(metaClient.getFs(), metaClient.getBasePath(), HoodieTestDataGenerator.avroSchema,
updatedRecords);
// Verify that all data file has one log file
metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
table = HoodieTable.getHoodieTable(metaClient, config);
for (String partitionPath : dataGen.getPartitionPaths()) {
List<FileSlice> groupedLogFiles =
table.getRTFileSystemView().getLatestFileSlices(partitionPath)
List<FileSlice> groupedLogFiles = table.getRTFileSystemView().getLatestFileSlices(partitionPath)
.collect(Collectors.toList());
for (FileSlice fileSlice : groupedLogFiles) {
assertEquals("There should be 1 log file written for every data file", 1,
fileSlice.getLogFiles().count());
assertEquals("There should be 1 log file written for every data file", 1, fileSlice.getLogFiles().count());
}
}
@@ -674,31 +636,27 @@ public class TestMergeOnReadTable {
table = HoodieTable.getHoodieTable(metaClient, config);
String commitTime = writeClient.startCompaction();
JavaRDD<WriteStatus> result =
writeClient.compact(commitTime);
JavaRDD<WriteStatus> result = writeClient.compact(commitTime);
// Verify that recently written compacted data file has no log file
metaClient = new HoodieTableMetaClient(jsc.hadoopConfiguration(), basePath);
table = HoodieTable.getHoodieTable(metaClient, config);
HoodieActiveTimeline timeline = metaClient.getActiveTimeline();
assertTrue("Compaction commit should be > than last insert",
HoodieTimeline.compareTimestamps(timeline.lastInstant().get().getTimestamp(), newCommitTime,
HoodieTimeline.GREATER));
assertTrue("Compaction commit should be > than last insert", HoodieTimeline.compareTimestamps(
timeline.lastInstant().get().getTimestamp(), newCommitTime, HoodieTimeline.GREATER));
for (String partitionPath : dataGen.getPartitionPaths()) {
List<FileSlice> groupedLogFiles = table.getRTFileSystemView()
.getLatestFileSlices(partitionPath)
List<FileSlice> groupedLogFiles = table.getRTFileSystemView().getLatestFileSlices(partitionPath)
.collect(Collectors.toList());
for (FileSlice slice : groupedLogFiles) {
assertTrue(
"After compaction there should be no log files visiable on a Realtime view",
assertTrue("After compaction there should be no log files visiable on a Realtime view",
slice.getLogFiles().collect(Collectors.toList()).isEmpty());
}
List<WriteStatus> writeStatuses = result.collect();
assertTrue(writeStatuses.stream()
.filter(writeStatus -> writeStatus.getStat().getPartitionPath()
.contentEquals(partitionPath)).count() > 0);
.filter(writeStatus -> writeStatus.getStat().getPartitionPath().contentEquals(partitionPath))
.count() > 0);
}
}
@@ -707,16 +665,13 @@ public class TestMergeOnReadTable {
}
private HoodieWriteConfig.Builder getConfigBuilder(Boolean autoCommit) {
return HoodieWriteConfig.newBuilder().withPath(basePath)
.withSchema(TRIP_EXAMPLE_SCHEMA).withParallelism(2, 2)
.withAutoCommit(autoCommit)
.withAssumeDatePartitioning(true)
.withCompactionConfig(
HoodieCompactionConfig.newBuilder().compactionSmallFileSize(1024 * 1024 * 1024)
.withInlineCompaction(false).withMaxNumDeltaCommitsBeforeCompaction(1).build())
return HoodieWriteConfig.newBuilder().withPath(basePath).withSchema(TRIP_EXAMPLE_SCHEMA).withParallelism(2, 2)
.withAutoCommit(autoCommit).withAssumeDatePartitioning(true).withCompactionConfig(
HoodieCompactionConfig.newBuilder().compactionSmallFileSize(1024 * 1024 * 1024).withInlineCompaction(false)
.withMaxNumDeltaCommitsBeforeCompaction(1).build())
.withStorageConfig(HoodieStorageConfig.newBuilder().limitFileSize(1024 * 1024 * 1024).build())
.forTable("test-trip-table").withIndexConfig(
HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build());
.forTable("test-trip-table")
.withIndexConfig(HoodieIndexConfig.newBuilder().withIndexType(HoodieIndex.IndexType.BLOOM).build());
}
private void assertNoWriteErrors(List<WriteStatus> statuses) {

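The compaction test above boils down to a fixed sequence: write delta commits, schedule a compaction, run it, and then check that the timeline gained an instant newer than the last delta commit. For reference, a condensed sketch of that sequence (not part of the diff above); only calls that appear in the test are used, and the import paths plus the variable wiring are assumed from the surrounding test code.

    import org.apache.hadoop.conf.Configuration;
    import org.apache.spark.api.java.JavaRDD;
    import com.uber.hoodie.HoodieWriteClient;
    import com.uber.hoodie.WriteStatus;
    import com.uber.hoodie.common.table.HoodieTableMetaClient;
    import com.uber.hoodie.common.table.HoodieTimeline;
    import com.uber.hoodie.common.table.timeline.HoodieActiveTimeline;

    // Condensed sketch of the compaction flow exercised in TestMergeOnReadTable above.
    public class CompactionFlowSketch {

      public static boolean compactAndVerify(HoodieWriteClient writeClient, Configuration hadoopConf,
          String basePath, String lastDeltaCommitTime) {
        // Schedule and execute a compaction; the returned statuses could also be checked for write errors.
        String compactionCommitTime = writeClient.startCompaction();
        JavaRDD<WriteStatus> statuses = writeClient.compact(compactionCommitTime);

        // The compaction instant must sort after the last delta commit it compacted.
        HoodieTableMetaClient metaClient = new HoodieTableMetaClient(hadoopConf, basePath);
        HoodieActiveTimeline timeline = metaClient.getActiveTimeline();
        return HoodieTimeline.compareTimestamps(
            timeline.lastInstant().get().getTimestamp(), lastDeltaCommitTime, HoodieTimeline.GREATER);
      }
    }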
View File

@@ -33,10 +33,10 @@ public class HoodieAvroWriteSupport extends AvroWriteSupport {
private String maxRecordKey;
public final static String HOODIE_AVRO_BLOOM_FILTER_METADATA_KEY =
public static final String HOODIE_AVRO_BLOOM_FILTER_METADATA_KEY =
"com.uber.hoodie.bloomfilter";
public final static String HOODIE_MIN_RECORD_KEY_FOOTER = "hoodie_min_record_key";
public final static String HOODIE_MAX_RECORD_KEY_FOOTER = "hoodie_max_record_key";
public static final String HOODIE_MIN_RECORD_KEY_FOOTER = "hoodie_min_record_key";
public static final String HOODIE_MAX_RECORD_KEY_FOOTER = "hoodie_max_record_key";
public HoodieAvroWriteSupport(MessageType schema, Schema avroSchema, BloomFilter bloomFilter) {

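HoodieAvroWriteSupport above stamps a bloom filter plus the min/max record keys into the parquet footer under the metadata keys shown. For reference, a minimal sketch of reading that footer back (not part of the diff above); it reuses ParquetUtils.readBloomFilterFromParquetMetadata and BloomFilter.mightContain exactly as TestCopyOnWriteTable does, while the import paths are assumed.

    import org.apache.hadoop.conf.Configuration;
    import org.apache.hadoop.fs.Path;
    import com.uber.hoodie.common.BloomFilter;
    import com.uber.hoodie.common.util.ParquetUtils;

    // Minimal sketch: probe the bloom filter that HoodieAvroWriteSupport wrote into
    // the parquet footer to ask whether a record key might be present in the file.
    public class BloomFooterProbe {

      public static boolean keyMightExist(Configuration conf, Path parquetFilePath, String recordKey) {
        BloomFilter filter = ParquetUtils.readBloomFilterFromParquetMetadata(conf, parquetFilePath);
        return filter.mightContain(recordKey);
      }
    }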
View File

@@ -16,6 +16,7 @@
package com.uber.hoodie.avro;
import com.fasterxml.jackson.databind.ObjectMapper;
import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;
@@ -24,11 +25,11 @@ import java.util.Map;
import org.apache.avro.Schema;
import org.apache.avro.generic.GenericData;
import org.apache.avro.generic.GenericRecord;
import com.fasterxml.jackson.databind.ObjectMapper;
/**
* Majority of this is copied from https://github.com/jwills/avro-json/blob/master/src/main/java/com/cloudera/science/avro/common/JsonConverter.java
* Adjusted for expected behavior of our use cases
* Majority of this is copied from
* https://github.com/jwills/avro-json/blob/master/src/main/java/com/cloudera/science/avro/
* common/JsonConverter.java Adjusted for expected behavior of our use cases
*/
public class MercifulJsonConverter {
@@ -132,10 +133,10 @@ public class MercifulJsonConverter {
}
private boolean isOptional(Schema schema) {
return schema.getType().equals(Schema.Type.UNION) &&
schema.getTypes().size() == 2 &&
(schema.getTypes().get(0).getType().equals(Schema.Type.NULL) ||
schema.getTypes().get(1).getType().equals(Schema.Type.NULL));
return schema.getType().equals(Schema.Type.UNION)
&& schema.getTypes().size() == 2
&& (schema.getTypes().get(0).getType().equals(Schema.Type.NULL)
|| schema.getTypes().get(1).getType().equals(Schema.Type.NULL));
}
private Schema getNonNull(Schema schema) {

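The isOptional check above treats a field as optional when its schema is a two-branch union containing a NULL branch, and getNonNull then picks out the non-null branch. A minimal sketch of the kind of schema that logic targets (not part of the diff above), built with the standard Avro API:

    import java.util.Arrays;
    import org.apache.avro.Schema;

    // Minimal sketch: an "optional string" is modelled in Avro as the union
    // ["null", "string"]; isOptional() matches this shape and getNonNull()
    // would pick out the string branch.
    public class OptionalSchemaSketch {

      public static Schema optionalString() {
        return Schema.createUnion(Arrays.asList(
            Schema.create(Schema.Type.NULL),
            Schema.create(Schema.Type.STRING)));
      }
    }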
View File

@@ -113,9 +113,8 @@ public class HoodieCleanStat implements Serializable {
}
public Builder withEarliestCommitRetained(Optional<HoodieInstant> earliestCommitToRetain) {
this.earliestCommitToRetain = (earliestCommitToRetain.isPresent()) ?
earliestCommitToRetain.get().getTimestamp() :
"-1";
this.earliestCommitToRetain = (earliestCommitToRetain.isPresent())
? earliestCommitToRetain.get().getTimestamp() : "-1";
return this;
}

View File

@@ -210,12 +210,18 @@ public class HoodieCommitMetadata implements Serializable {
@Override
public boolean equals(Object o) {
if (this == o) return true;
if (o == null || getClass() != o.getClass()) return false;
if (this == o) {
return true;
}
if (o == null || getClass() != o.getClass()) {
return false;
}
HoodieCommitMetadata that = (HoodieCommitMetadata) o;
if (!partitionToWriteStats.equals(that.partitionToWriteStats)) return false;
if (!partitionToWriteStats.equals(that.partitionToWriteStats)) {
return false;
}
return compacted.equals(that.compacted);
}

View File

@@ -39,7 +39,6 @@ public class HoodieFileGroup implements Serializable {
};
}
/**
* Partition containing the file group.
*/
@@ -107,8 +106,8 @@ public class HoodieFileGroup implements Serializable {
*/
private boolean isFileSliceCommitted(FileSlice slice) {
String maxCommitTime = lastInstant.get().getTimestamp();
return timeline.containsOrBeforeTimelineStarts(slice.getBaseCommitTime()) &&
HoodieTimeline.compareTimestamps(slice.getBaseCommitTime(),
return timeline.containsOrBeforeTimelineStarts(slice.getBaseCommitTime())
&& HoodieTimeline.compareTimestamps(slice.getBaseCommitTime(),
maxCommitTime,
HoodieTimeline.LESSER_OR_EQUAL);
@@ -128,7 +127,7 @@ public class HoodieFileGroup implements Serializable {
/**
* Gets the latest slice - this can contain either
*
* <p>
* - just the log files without data file - (or) data file with 0 or more log files
*/
public Optional<FileSlice> getLatestFileSlice() {

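getLatestFileSlice() above can therefore hand back a slice holding only log files, or a data file with zero or more log files. For reference, a minimal sketch of walking the latest slices of a partition the way TestMergeOnReadTable does (not part of the diff above); getRTFileSystemView, getLatestFileSlices, getBaseCommitTime and getLogFiles all appear in that test, while the import paths are assumed.

    import java.util.stream.Collectors;
    import com.uber.hoodie.common.model.FileSlice;
    import com.uber.hoodie.table.HoodieTable;

    // Minimal sketch: report how many log files hang off the latest file slice of each
    // file group in a partition, mirroring the assertions in TestMergeOnReadTable.
    public class LatestSliceReport {

      public static void printLogFileCounts(HoodieTable table, String partitionPath) {
        for (FileSlice slice : table.getRTFileSystemView()
            .getLatestFileSlices(partitionPath).collect(Collectors.toList())) {
          System.out.println(slice.getBaseCommitTime() + " -> " + slice.getLogFiles().count() + " log file(s)");
        }
      }
    }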
View File

@@ -21,7 +21,7 @@ import java.io.Serializable;
/**
* HoodieKey consists of
*
* <p>
* - recordKey : a recordKey that acts as primary key for a record - partitionPath : path to the
* partition that contains the record
*/
@@ -54,8 +54,8 @@ public class HoodieKey implements Serializable {
return false;
}
HoodieKey otherKey = (HoodieKey) o;
return Objects.equal(recordKey, otherKey.recordKey) &&
Objects.equal(partitionPath, otherKey.partitionPath);
return Objects.equal(recordKey, otherKey.recordKey)
&& Objects.equal(partitionPath, otherKey.partitionPath);
}
@Override

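The javadoc above describes a HoodieKey as the (recordKey, partitionPath) pair that identifies a record. A one-method sketch of building a record around such a key (not part of the diff above); the constructor shapes match the usages in TestCopyOnWriteTable earlier in this diff.

    import com.uber.hoodie.common.model.HoodieKey;
    import com.uber.hoodie.common.model.HoodieRecord;
    import com.uber.hoodie.common.model.HoodieRecordPayload;

    // Minimal sketch: a HoodieKey pairs a record key with the partition path that
    // holds the record; a HoodieRecord wraps that key together with its payload.
    public class KeySketch {

      public static HoodieRecord toHoodieRecord(String recordKey, String partitionPath,
          HoodieRecordPayload payload) {
        return new HoodieRecord(new HoodieKey(recordKey, partitionPath), payload);
      }
    }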
View File

@@ -30,7 +30,7 @@ import org.apache.hadoop.fs.Path;
/**
* Abstracts a single log file. Contains methods to extract metadata like the fileId, version and
* extension from the log file path.
*
* <p>
* Also contains logic to roll-over the log file
*/
public class HoodieLogFile implements Serializable {
@@ -103,8 +103,12 @@ public class HoodieLogFile implements Serializable {
@Override
public boolean equals(Object o) {
if (this == o) return true;
if (o == null || getClass() != o.getClass()) return false;
if (this == o) {
return true;
}
if (o == null || getClass() != o.getClass()) {
return false;
}
HoodieLogFile that = (HoodieLogFile) o;
return path != null ? path.equals(that.path) : that.path == null;
}

View File

@@ -101,9 +101,8 @@ public class HoodiePartitionMetadata {
}
} catch (IOException ioe) {
log.warn(
"Error trying to save partition metadata (this is okay, as long as atleast 1 of these succced), "
+
partitionPath, ioe);
"Error trying to save partition metadata (this is okay, as long as "
+ "atleast 1 of these succced), " + partitionPath, ioe);
} finally {
if (!metafileExists) {
try {

View File

@@ -118,10 +118,10 @@ public class HoodieRecord<T extends HoodieRecordPayload> implements Serializable
return false;
}
HoodieRecord that = (HoodieRecord) o;
return Objects.equal(key, that.key) &&
Objects.equal(data, that.data) &&
Objects.equal(currentLocation, that.currentLocation) &&
Objects.equal(newLocation, that.newLocation);
return Objects.equal(key, that.key)
&& Objects.equal(data, that.data)
&& Objects.equal(currentLocation, that.currentLocation)
&& Objects.equal(newLocation, that.newLocation);
}
@Override

View File

@@ -42,8 +42,8 @@ public class HoodieRecordLocation implements Serializable {
return false;
}
HoodieRecordLocation otherLoc = (HoodieRecordLocation) o;
return Objects.equal(commitTime, otherLoc.commitTime) &&
Objects.equal(fileId, otherLoc.fileId);
return Objects.equal(commitTime, otherLoc.commitTime)
&& Objects.equal(fileId, otherLoc.fileId);
}
@Override

View File

@@ -38,7 +38,7 @@ public interface HoodieRecordPayload<T extends HoodieRecordPayload> extends Seri
/**
* This method lets you write custom merging/combining logic to produce new values as a function
* of the current value on storage and what's contained in this object.
*
* <p>
* eg: 1) You are updating counters, you may want to add counts to currentValue and write back
* updated counts 2) You may be reading DB redo logs, and merge them with current image for a
* database row on storage

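As a hedged illustration of the counter example in the javadoc above (not part of the diff), the sketch below adds an incoming count to the count already on storage. The interface methods assumed here — preCombine, combineAndGetUpdateValue and getInsertValue — are not shown in this diff, and the field name "count" is hypothetical, so treat the signatures and field access as assumptions rather than the actual API.

    import java.io.IOException;
    import java.util.Optional;
    import org.apache.avro.Schema;
    import org.apache.avro.generic.GenericRecord;
    import org.apache.avro.generic.IndexedRecord;
    import com.uber.hoodie.common.model.HoodieRecordPayload;

    // Hedged sketch of a counter-style payload: merge by adding the stored count to
    // the incoming count. Method signatures are assumed, not taken from this diff.
    public class CountingPayload implements HoodieRecordPayload<CountingPayload> {

      private final GenericRecord incoming;

      public CountingPayload(GenericRecord incoming) {
        this.incoming = incoming;
      }

      @Override
      public CountingPayload preCombine(CountingPayload another) {
        // Keep this payload; a real implementation might sum the two counts here.
        return this;
      }

      @Override
      public Optional<IndexedRecord> combineAndGetUpdateValue(IndexedRecord currentValue, Schema schema)
          throws IOException {
        // Add the count already on storage to the incoming count and emit the merged record.
        long stored = (Long) ((GenericRecord) currentValue).get("count");
        incoming.put("count", stored + (Long) incoming.get("count"));
        return Optional.of(incoming);
      }

      @Override
      public Optional<IndexedRecord> getInsertValue(Schema schema) throws IOException {
        return Optional.of(incoming);
      }
    }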
View File

@@ -18,16 +18,16 @@ package com.uber.hoodie.common.model;
/**
* Type of the Hoodie Table.
*
* <p>
* Currently, 1 type is supported
*
* <p>
* COPY_ON_WRITE - Performs upserts by versioning entire files, with later versions containing newer
* value of a record.
*
* <p>
* In the future, the following might be added.
*
* <p>
* MERGE_ON_READ - Speeds up upserts, by delaying merge until enough work piles up.
*
* <p>
* SIMPLE_LSM - A simple 2 level LSM tree.
*/
public enum HoodieTableType {

Some files were not shown because too many files have changed in this diff.