[HUDI-2837] Add support for using database name in incremental query (#4083)

@@ -85,6 +85,7 @@ object HoodieSparkSqlWriter {
     validateTableConfig(sqlContext.sparkSession, optParams, tableConfig)
 
     val (parameters, hoodieConfig) = mergeParamsAndGetHoodieConfig(optParams, tableConfig)
+    val databaseName = hoodieConfig.getStringOrDefault(HoodieTableConfig.DATABASE_NAME, "")
     val tblName = hoodieConfig.getStringOrThrow(HoodieWriteConfig.TBL_NAME,
       s"'${HoodieWriteConfig.TBL_NAME.key}' must be set.").trim
     assert(!StringUtils.isNullOrEmpty(hoodieConfig.getString(HoodieWriteConfig.TBL_NAME)),

@@ -131,6 +132,7 @@ object HoodieSparkSqlWriter {
 
         val tableMetaClient = HoodieTableMetaClient.withPropertyBuilder()
           .setTableType(tableType)
+          .setDatabaseName(databaseName)
           .setTableName(tblName)
           .setRecordKeyFields(recordKeyFields)
           .setBaseFileFormat(baseFileFormat)
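
Taken together, the two hunks above read the configured database name out of the merged table config and persist it through the meta client builder. A minimal sketch of the same builder call, assuming a local base path and a fresh Hadoop configuration (all values are illustrative, not from the patch):

    import org.apache.hadoop.conf.Configuration
    import org.apache.hudi.common.model.HoodieTableType
    import org.apache.hudi.common.table.HoodieTableMetaClient

    // Hypothetical values for illustration only.
    val hadoopConf = new Configuration()
    val basePath = "/tmp/hudi/hudi_trips"

    val metaClient = HoodieTableMetaClient.withPropertyBuilder()
      .setTableType(HoodieTableType.COPY_ON_WRITE)
      .setDatabaseName("default") // persisted alongside the table name in hoodie.properties
      .setTableName("hudi_trips")
      .setRecordKeyFields("uuid")
      .initTable(hadoopConf, basePath)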

@@ -21,8 +21,7 @@ import org.apache.hudi.AvroConversionUtils
 import org.apache.hudi.HoodieWriterUtils._
 import org.apache.hudi.common.config.DFSPropertiesConfiguration
 import org.apache.hudi.common.model.HoodieTableType
-import org.apache.hudi.common.table.HoodieTableConfig
-import org.apache.hudi.common.table.HoodieTableMetaClient
+import org.apache.hudi.common.table.{HoodieTableConfig, HoodieTableMetaClient}
 import org.apache.hudi.common.util.ValidationUtils
 import org.apache.hudi.keygen.ComplexKeyGenerator
 import org.apache.hudi.keygen.factory.HoodieSparkKeyGeneratorFactory

@@ -184,8 +183,10 @@ class HoodieCatalogTable(val spark: SparkSession, val table: CatalogTable) exten
     } else {
       val (recordName, namespace) = AvroConversionUtils.getAvroRecordNameAndNamespace(table.identifier.table)
       val schema = SchemaConverters.toAvroType(finalSchema, false, recordName, namespace)
+      val hoodieDatabaseName = formatName(spark, table.identifier.database.getOrElse(spark.sessionState.catalog.getCurrentDatabase))
       HoodieTableMetaClient.withPropertyBuilder()
         .fromProperties(properties)
+        .setDatabaseName(hoodieDatabaseName)
         .setTableName(table.identifier.table)
         .setTableCreateSchema(schema.toString())
         .setPartitionFields(table.partitionColumnNames.mkString(","))
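
In the hunk above, the Catalyst schema is converted to an Avro schema string before being stored as the table-create schema. A minimal standalone sketch of that conversion, assuming spark-avro's SchemaConverters (the schema and names are made up):

    import org.apache.spark.sql.avro.SchemaConverters
    import org.apache.spark.sql.types.{LongType, StringType, StructField, StructType}

    val finalSchema = StructType(Seq(
      StructField("uuid", StringType, nullable = false),
      StructField("ts", LongType, nullable = false)))

    // nullable = false: the top-level record is not wrapped in a union with null.
    val avroSchema = SchemaConverters.toAvroType(
      finalSchema, nullable = false, recordName = "trips_record", nameSpace = "hoodie.trips")
    println(avroSchema.toString(true)) // pretty-printed Avro JSON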

@@ -202,11 +202,11 @@ object HoodieOptionConfig {
       s"Can't find primaryKey `$primaryKey` in ${schema.treeString}.")
   }
 
-  // validate precombine key
-  val precombineKey = sqlOptions.get(SQL_KEY_PRECOMBINE_FIELD.sqlKeyName)
-  if (precombineKey.isDefined && precombineKey.get.nonEmpty) {
-    ValidationUtils.checkArgument(schema.exists(f => resolver(f.name, precombineKey.get)),
-      s"Can't find preCombineKey `${precombineKey.get}` in ${schema.treeString}.")
+  // validate preCombine key
+  val preCombineKey = sqlOptions.get(SQL_KEY_PRECOMBINE_FIELD.sqlKeyName)
+  if (preCombineKey.isDefined && preCombineKey.get.nonEmpty) {
+    ValidationUtils.checkArgument(schema.exists(f => resolver(f.name, preCombineKey.get)),
+      s"Can't find preCombineKey `${preCombineKey.get}` in ${schema.treeString}.")
   }
 
   // validate table type
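
The renamed block validates the preCombine field against the table schema with a Spark resolver. A minimal standalone sketch of the same membership check, assuming case-insensitive resolution (schema and field names are made up):

    import org.apache.spark.sql.catalyst.analysis.caseInsensitiveResolution
    import org.apache.spark.sql.types.{LongType, StringType, StructField, StructType}

    val schema = StructType(Seq(
      StructField("uuid", StringType),
      StructField("ts", LongType)))

    // Same shape as the check above: does any schema field match the key?
    def fieldExists(key: String): Boolean =
      schema.exists(f => caseInsensitiveResolution(f.name, key))

    assert(fieldExists("TS"))         // matches "ts" case-insensitively
    assert(!fieldExists("eventTime"))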

@@ -123,12 +123,12 @@ object CreateHoodieTableCommand {
       table.storage.compressed,
       storageProperties + ("path" -> path))
 
-    val tablName = HoodieSqlCommonUtils.formatName(sparkSession, table.identifier.table)
+    val tableName = HoodieSqlCommonUtils.formatName(sparkSession, table.identifier.table)
     val newDatabaseName = HoodieSqlCommonUtils.formatName(sparkSession, table.identifier.database
       .getOrElse(catalog.getCurrentDatabase))
 
     val newTableIdentifier = table.identifier
-      .copy(table = tablName, database = Some(newDatabaseName))
+      .copy(table = tableName, database = Some(newDatabaseName))
 
     val partitionColumnNames = hoodieCatalogTable.partitionSchema.map(_.name)
     // append pk, preCombineKey, type to the properties of table
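
Besides fixing the tablName typo, this block rebuilds the identifier: the table name is normalized and the database is made explicit, falling back to the catalog's current database. A minimal sketch of that normalization, with a stand-in for HoodieSqlCommonUtils.formatName (the helper qualify is hypothetical):

    import org.apache.spark.sql.SparkSession
    import org.apache.spark.sql.catalyst.TableIdentifier

    // Stand-in for formatName: lower-case unless the session is case sensitive.
    def formatName(spark: SparkSession, name: String): String =
      if (spark.sessionState.conf.caseSensitiveAnalysis) name else name.toLowerCase

    def qualify(spark: SparkSession, id: TableIdentifier): TableIdentifier =
      id.copy(
        table = formatName(spark, id.table),
        database = Some(formatName(spark,
          id.database.getOrElse(spark.sessionState.catalog.getCurrentDatabase))))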

@@ -50,7 +50,7 @@ class TruncateHoodieTableCommand(
   }
 
   // If we have not specified the partition, truncate will delete all the data in the table path
-  // include the hoodi.properties. In this case we should reInit the table.
+  // include the hoodie.properties. In this case we should reInit the table.
   if (partitionSpec.isEmpty) {
     val hadoopConf = sparkSession.sessionState.newHadoopConf()
     // ReInit hoodie.properties
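
Because a full truncate deletes hoodie.properties along with the data, the command re-initializes the table metadata afterwards. A minimal sketch of such a re-init, assuming the table's properties were captured before the delete (paths and property values are illustrative):

    import org.apache.hadoop.conf.Configuration
    import org.apache.hudi.common.table.HoodieTableMetaClient

    // Hypothetical values; the real command reuses the table's own
    // properties and the session's Hadoop configuration.
    val hadoopConf = new Configuration()
    val tablePath = "/tmp/hudi/hudi_trips"
    val props = new java.util.Properties()
    props.setProperty("hoodie.table.name", "hudi_trips")
    props.setProperty("hoodie.table.type", "COPY_ON_WRITE")

    // Rewrites hoodie.properties under tablePath/.hoodie.
    HoodieTableMetaClient.withPropertyBuilder()
      .fromProperties(props)
      .initTable(hadoopConf, tablePath)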

@@ -115,7 +115,7 @@ class ExpressionPayload(record: GenericRecord,
     if (targetRecord.isEmpty || needUpdatingPersistedRecord(targetRecord.get, resultRecord, properties)) {
       resultRecordOpt = HOption.of(resultRecord)
     } else {
-      // if the PreCombine field value of targetRecord is greate
+      // if the PreCombine field value of targetRecord is greater
       // than the new incoming record, just keep the old record value.
       resultRecordOpt = HOption.of(targetRecord.get)
     }
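
The branch above is preCombine semantics in miniature: the persisted record wins whenever its preCombine (ordering) field value is greater than the incoming record's. A standalone sketch of that rule (the record type and field are made up):

    // Hypothetical record with an ordering (preCombine) field "ts".
    case class Rec(key: String, ts: Long, value: String)

    // Keep the old record when its preCombine value is greater, mirroring the branch above.
    def preCombine(incoming: Rec, persisted: Option[Rec]): Rec =
      persisted match {
        case Some(old) if old.ts > incoming.ts => old
        case _ => incoming
      }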

@@ -270,7 +270,7 @@ class ExpressionPayload(record: GenericRecord,
 object ExpressionPayload {
 
   /**
-   * Property for pass the merge-into delete clause condition expresssion.
+   * Property for pass the merge-into delete clause condition expression.
   */
   val PAYLOAD_DELETE_CONDITION = "hoodie.payload.delete.condition"
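
PAYLOAD_DELETE_CONDITION carries the merge-into delete clause condition to the payload through the write properties. A minimal sketch of how such a property travels (the value shown is a placeholder; the real one is a serialized Spark expression):

    import java.util.Properties

    // Hypothetical: hand the delete-clause condition to the payload via properties.
    val props = new Properties()
    props.setProperty("hoodie.payload.delete.condition", "<serialized expression>")

    // The payload side reads it back when combining records.
    val deleteCondition = Option(props.getProperty("hoodie.payload.delete.condition"))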