1
0

[HUDI-4210] Create custom hbase index to solve data skew issue on hbase regions (#5797)

This commit is contained in:
冯健
2022-07-26 18:09:17 +08:00
committed by GitHub
parent 1ea1e659c2
commit e5faf2cc84
4 changed files with 53 additions and 3 deletions

View File

@@ -183,6 +183,10 @@ public class HoodieHBaseIndexConfig extends HoodieConfig {
.noDefaultValue()
.withDocumentation("The value of hbase.master.kerberos.principal in hbase cluster.");
/**
 * Integer config property registered under the key {@code hoodie.index.hbase.bucket.number},
 * with a default value of 8.
 *
 * <p>Per its own documentation string, the setting is only applicable when
 * RebalancedSparkHoodieHBaseIndex is in use, and matching it to the number of
 * HBase regions is recommended for best performance.
 *
 * <p>NOTE(review): how the index consumes this value is not visible from this declaration.
 */
public static final ConfigProperty<Integer> BUCKET_NUMBER = ConfigProperty
.key("hoodie.index.hbase.bucket.number")
.defaultValue(8)
.withDocumentation("Only applicable when using RebalancedSparkHoodieHBaseIndex, same as hbase regions count can get the best performance");
/**
* @deprecated Use {@link #ZKQUORUM} and its methods instead

View File

@@ -1553,6 +1553,10 @@ public class HoodieWriteConfig extends HoodieConfig {
return getBooleanOrDefault(HoodieHBaseIndexConfig.UPDATE_PARTITION_PATH_ENABLE);
}
/**
 * Looks up the integer setting stored under {@link HoodieHBaseIndexConfig#BUCKET_NUMBER}.
 *
 * <p>NOTE(review): the method name speaks of a region count while the backing
 * property is named "bucket number" -- confirm callers treat the two as the same quantity.
 *
 * @return the value {@code getInt} yields for that property
 */
public int getHBaseIndexRegionCount() {
  final int bucketNumber = getInt(HoodieHBaseIndexConfig.BUCKET_NUMBER);
  return bucketNumber;
}
/**
 * Looks up the integer setting stored under {@link HoodieIndexConfig#BLOOM_INDEX_PARALLELISM}.
 *
 * @return the value {@code getInt} yields for that property
 */
public int getBloomIndexParallelism() {
  final int parallelism = getInt(HoodieIndexConfig.BLOOM_INDEX_PARALLELISM);
  return parallelism;
}