feat(patch): 增加一个patch包用来放hudi相关代码
latest_op_ts相关的内容,直接放在业务包里,spark无法使用,单独打在patch包里,可以方便其他人加到spark jar里
This commit is contained in:
@@ -3,7 +3,7 @@ root_path=$(dirname $(cd $(dirname $0);pwd))
|
|||||||
source $root_path/bin/library.sh
|
source $root_path/bin/library.sh
|
||||||
mvn deploy -N -D skipTests -P local -s ~/.m2/settings-development.xml
|
mvn deploy -N -D skipTests -P local -s ~/.m2/settings-development.xml
|
||||||
deploy service-common service-dependencies service-configuration service-forest service-cli service-cli/service-cli-core service-executor service-executor/service-executor-core utils/executor
|
deploy service-common service-dependencies service-configuration service-forest service-cli service-cli/service-cli-core service-executor service-executor/service-executor-core utils/executor
|
||||||
package service-api service-check service-cli/service-cli-runner service-cloud-query service-executor/service-executor-manager service-executor/service-executor-task service-command service-command-pro service-exporter service-flink-query service-gateway service-hudi-query service-info-query service-monitor service-loki-query service-pulsar-query service-queue service-scheduler service-uploader service-web service-yarn-query service-zookeeper-query utils/sync
|
package service-api service-check service-cli/service-cli-runner service-cloud-query service-executor/service-executor-manager service-executor/service-executor-task service-command service-command-pro service-exporter service-flink-query service-gateway service-hudi-query service-info-query service-monitor service-loki-query service-pulsar-query service-queue service-scheduler service-uploader service-web service-yarn-query service-zookeeper-query utils/patch utils/sync
|
||||||
|
|
||||||
configs=(b2a4 b2b1 b2b5 b2b12)
|
configs=(b2a4 b2b1 b2b5 b2b12)
|
||||||
for config in ${configs[*]};
|
for config in ${configs[*]};
|
||||||
|
|||||||
6
pom.xml
6
pom.xml
@@ -37,6 +37,7 @@
|
|||||||
<module>service-yarn-query</module>
|
<module>service-yarn-query</module>
|
||||||
<module>service-zookeeper-query</module>
|
<module>service-zookeeper-query</module>
|
||||||
<module>utils/sync</module>
|
<module>utils/sync</module>
|
||||||
|
<module>utils/patch</module>
|
||||||
</modules>
|
</modules>
|
||||||
|
|
||||||
<properties>
|
<properties>
|
||||||
@@ -124,6 +125,11 @@
|
|||||||
<artifactId>executor</artifactId>
|
<artifactId>executor</artifactId>
|
||||||
<version>${project.version}</version>
|
<version>${project.version}</version>
|
||||||
</dependency>
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>com.lanyuanxiaoyao</groupId>
|
||||||
|
<artifactId>patch</artifactId>
|
||||||
|
<version>${project.version}</version>
|
||||||
|
</dependency>
|
||||||
<dependency>
|
<dependency>
|
||||||
<groupId>com.lanyuanxiaoyao</groupId>
|
<groupId>com.lanyuanxiaoyao</groupId>
|
||||||
<artifactId>sync</artifactId>
|
<artifactId>sync</artifactId>
|
||||||
|
|||||||
69
utils/patch/pom.xml
Normal file
69
utils/patch/pom.xml
Normal file
@@ -0,0 +1,69 @@
|
|||||||
|
<?xml version="1.0" encoding="UTF-8"?>
|
||||||
|
<project xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
|
||||||
|
xmlns="http://maven.apache.org/POM/4.0.0"
|
||||||
|
xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
|
||||||
|
<parent>
|
||||||
|
<groupId>com.lanyuanxiaoyao</groupId>
|
||||||
|
<artifactId>hudi-service</artifactId>
|
||||||
|
<version>1.0.0-SNAPSHOT</version>
|
||||||
|
</parent>
|
||||||
|
<modelVersion>4.0.0</modelVersion>
|
||||||
|
|
||||||
|
<artifactId>patch</artifactId>
|
||||||
|
|
||||||
|
<properties>
|
||||||
|
<parquet.version>1.10.1</parquet.version>
|
||||||
|
</properties>
|
||||||
|
|
||||||
|
<dependencies>
|
||||||
|
<dependency>
|
||||||
|
<groupId>com.lanyuanxiaoyao</groupId>
|
||||||
|
<artifactId>service-common</artifactId>
|
||||||
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>org.apache.hudi</groupId>
|
||||||
|
<artifactId>hudi-flink${flink.major.version}-bundle</artifactId>
|
||||||
|
<scope>provided</scope>
|
||||||
|
</dependency>
|
||||||
|
</dependencies>
|
||||||
|
|
||||||
|
<build>
|
||||||
|
<plugins>
|
||||||
|
<plugin>
|
||||||
|
<groupId>org.apache.maven.plugins</groupId>
|
||||||
|
<artifactId>maven-shade-plugin</artifactId>
|
||||||
|
<configuration>
|
||||||
|
<createDependencyReducedPom>false</createDependencyReducedPom>
|
||||||
|
<promoteTransitiveDependencies>true</promoteTransitiveDependencies>
|
||||||
|
<transformers>
|
||||||
|
<transformer implementation="org.apache.maven.plugins.shade.resource.AppendingTransformer">
|
||||||
|
<resource>reference.conf</resource>
|
||||||
|
</transformer>
|
||||||
|
<transformer
|
||||||
|
implementation="org.apache.maven.plugins.shade.resource.ServicesResourceTransformer"/>
|
||||||
|
</transformers>
|
||||||
|
<filters>
|
||||||
|
<filter>
|
||||||
|
<artifact>*:*</artifact>
|
||||||
|
<excludes>
|
||||||
|
<exclude>META-INF/*.SF</exclude>
|
||||||
|
<exclude>META-INF/*.DSA</exclude>
|
||||||
|
<exclude>META-INF/*.RSA</exclude>
|
||||||
|
<exclude>log4j-surefire*.properties</exclude>
|
||||||
|
</excludes>
|
||||||
|
</filter>
|
||||||
|
</filters>
|
||||||
|
</configuration>
|
||||||
|
<executions>
|
||||||
|
<execution>
|
||||||
|
<phase>package</phase>
|
||||||
|
<goals>
|
||||||
|
<goal>shade</goal>
|
||||||
|
</goals>
|
||||||
|
</execution>
|
||||||
|
</executions>
|
||||||
|
</plugin>
|
||||||
|
</plugins>
|
||||||
|
</build>
|
||||||
|
|
||||||
|
</project>
|
||||||
@@ -0,0 +1,57 @@
|
|||||||
|
package org.apache.hudi.client;
|
||||||
|
|
||||||
|
import com.lanyuanxiaoyao.service.common.Constants;
|
||||||
|
import java.time.LocalDateTime;
|
||||||
|
import java.time.ZoneOffset;
|
||||||
|
import java.time.format.DateTimeFormatter;
|
||||||
|
import java.util.Map;
|
||||||
|
import org.apache.hudi.common.model.HoodieRecord;
|
||||||
|
import org.apache.hudi.common.util.Option;
|
||||||
|
import org.apache.hudi.common.util.StringUtils;
|
||||||
|
import org.slf4j.Logger;
|
||||||
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @author lanyuanxiaoyao
|
||||||
|
* @date 2023-04-17
|
||||||
|
*/
|
||||||
|
public class TraceWriteStatus extends WriteStatus {
|
||||||
|
private static final Logger logger = LoggerFactory.getLogger(TraceWriteStatus.class);
|
||||||
|
private static final DateTimeFormatter FORMATTER = DateTimeFormatter.ofPattern("yyyy-MM-dd HH:mm:ss");
|
||||||
|
private long latestOpts = 0L;
|
||||||
|
|
||||||
|
public TraceWriteStatus() {
|
||||||
|
super();
|
||||||
|
}
|
||||||
|
|
||||||
|
public TraceWriteStatus(Boolean trackSuccessRecords, Double failureFraction) {
|
||||||
|
super(trackSuccessRecords, failureFraction);
|
||||||
|
}
|
||||||
|
|
||||||
|
public long getLatestOpts() {
|
||||||
|
return latestOpts;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void markSuccess(HoodieRecord record, Option<Map<String, String>> optionalRecordMetadata) {
|
||||||
|
super.markSuccess(record, optionalRecordMetadata);
|
||||||
|
try {
|
||||||
|
optionalRecordMetadata.ifPresent(map -> {
|
||||||
|
if (map.containsKey(Constants.LATEST_OPERATION_TIMESTAMP_KEY_NAME)) {
|
||||||
|
String inOpts = map.get(Constants.LATEST_OPERATION_TIMESTAMP_KEY_NAME);
|
||||||
|
if (StringUtils.nonEmpty(inOpts)) {
|
||||||
|
long current = LocalDateTime.parse(inOpts, FORMATTER).toInstant(ZoneOffset.ofHours(8)).toEpochMilli();
|
||||||
|
latestOpts = Long.max(latestOpts, current);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
});
|
||||||
|
} catch (Throwable throwable) {
|
||||||
|
logger.error("Parse latest opts failure", throwable);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void markFailure(HoodieRecord record, Throwable t, Option<Map<String, String>> optionalRecordMetadata) {
|
||||||
|
super.markFailure(record, t, optionalRecordMetadata);
|
||||||
|
}
|
||||||
|
}
|
||||||
@@ -0,0 +1,57 @@
|
|||||||
|
package org.apache.hudi.common.model;
|
||||||
|
|
||||||
|
import com.lanyuanxiaoyao.service.common.Constants;
|
||||||
|
import java.util.HashMap;
|
||||||
|
import java.util.Map;
|
||||||
|
import org.apache.hudi.common.util.Option;
|
||||||
|
import org.apache.hudi.org.apache.avro.generic.GenericRecord;
|
||||||
|
import org.apache.hudi.org.apache.avro.util.Utf8;
|
||||||
|
import org.apache.hudi.table.HoodieTableFactory;
|
||||||
|
import org.slf4j.Logger;
|
||||||
|
import org.slf4j.LoggerFactory;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* 通过将latest_op_ts值写入payload进行传递,使压缩完成后可以从status中获取该值
|
||||||
|
* Hudi默认使用{@link OverwriteWithLatestAvroPayload},由于{@link HoodieTableFactory}156行中的说明
|
||||||
|
* 如果使用默认值,则改为使用{@link EventTimeAvroPayload},所以这里的payload直接继承EventTimeAvroPayload
|
||||||
|
* 从而符合原来的使用逻辑
|
||||||
|
*
|
||||||
|
* @author lanyuanxiaoyao
|
||||||
|
* @date 2023-04-18
|
||||||
|
*/
|
||||||
|
public class TraceEventTimeAvroPayload extends EventTimeAvroPayload {
|
||||||
|
private static final Logger logger = LoggerFactory.getLogger(TraceEventTimeAvroPayload.class);
|
||||||
|
|
||||||
|
private final String latestOpts;
|
||||||
|
|
||||||
|
public TraceEventTimeAvroPayload(GenericRecord record, Comparable orderingVal) {
|
||||||
|
super(record, orderingVal);
|
||||||
|
this.latestOpts = updateLatestOpts(Option.ofNullable(record));
|
||||||
|
}
|
||||||
|
|
||||||
|
public TraceEventTimeAvroPayload(Option<GenericRecord> record) {
|
||||||
|
super(record);
|
||||||
|
this.latestOpts = updateLatestOpts(record);
|
||||||
|
}
|
||||||
|
|
||||||
|
private String updateLatestOpts(Option<GenericRecord> record) {
|
||||||
|
try {
|
||||||
|
return record
|
||||||
|
.map(r -> ((Utf8) r.get(Constants.LATEST_OPERATION_TIMESTAMP_KEY_NAME)).toString())
|
||||||
|
.orElse(null);
|
||||||
|
} catch (Throwable throwable) {
|
||||||
|
logger.error("Get latest opts failure", throwable);
|
||||||
|
}
|
||||||
|
return null;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public Option<Map<String, String>> getMetadata() {
|
||||||
|
if (this.latestOpts == null) {
|
||||||
|
return Option.empty();
|
||||||
|
}
|
||||||
|
Map<String, String> metadata = super.getMetadata().orElse(new HashMap<>());
|
||||||
|
metadata.put(Constants.LATEST_OPERATION_TIMESTAMP_KEY_NAME, this.latestOpts);
|
||||||
|
return Option.of(metadata);
|
||||||
|
}
|
||||||
|
}
|
||||||
@@ -20,6 +20,10 @@
|
|||||||
<groupId>com.lanyuanxiaoyao</groupId>
|
<groupId>com.lanyuanxiaoyao</groupId>
|
||||||
<artifactId>service-common</artifactId>
|
<artifactId>service-common</artifactId>
|
||||||
</dependency>
|
</dependency>
|
||||||
|
<dependency>
|
||||||
|
<groupId>com.lanyuanxiaoyao</groupId>
|
||||||
|
<artifactId>patch</artifactId>
|
||||||
|
</dependency>
|
||||||
<dependency>
|
<dependency>
|
||||||
<groupId>org.apache.hudi</groupId>
|
<groupId>org.apache.hudi</groupId>
|
||||||
<artifactId>hudi-flink${flink.major.version}-bundle</artifactId>
|
<artifactId>hudi-flink${flink.major.version}-bundle</artifactId>
|
||||||
|
|||||||
Reference in New Issue
Block a user