feat(monitor): 增加指标输出模块

一些外部指标查询通过指标输出模块输出,避免对原业务模块产生影响
This commit is contained in:
2024-03-05 12:21:38 +08:00
parent 41d5a6b264
commit d4e161459a
14 changed files with 355 additions and 12 deletions

View File

@@ -1,3 +1,12 @@
GET http://{{username}}:{{password}}@b12s15.hdp.dc:21685/pulsar/backlog?name=main&topic=persistent://odcp/grid/grid_serv_staff&subscription=Hudi_Sync_Pulsar_Reader_1552408245762723840_grid_grid_serv_staff_b_20230425
Connection: Keep-Alive
User-Agent: Apache-HttpClient/4.5.14 (Java/17.0.10)
Accept-Encoding: br,deflate,gzip,x-gzip
<> 2024-03-05T111533.200.json
###
GET http://{{username}}:{{password}}@132.126.207.130:35690/hudi_services/service-exporter/exporter/un_running_flink_job
Connection: Keep-Alive
User-Agent: Apache-HttpClient/4.5.14 (Java/17.0.9)
@@ -398,11 +407,3 @@ Accept-Encoding: br,deflate,gzip,x-gzip
###
GET http://{{username}}:{{password}}@132.126.207.130:35690/hudi_services/queue/queue/clear?name=compaction-queue-pre
Connection: Keep-Alive
User-Agent: Apache-HttpClient/4.5.14 (Java/17.0.9)
Cookie: JSESSIONID=9AB8D98C10FACE15EA1CB758D79F8877
Accept-Encoding: br,deflate,gzip,x-gzip
###

6
bin/build-monitor.sh Executable file
View File

@@ -0,0 +1,6 @@
#!/bin/bash
# Builds the service-monitor module and uploads the repackaged jar.
#
# Steps:
#   1. Deploy the shared modules (common, dependencies, configuration).
#   2. Package service-monitor as an executable Spring Boot jar.
#   3. Hand the jar to `upload` (presumably defined in bin/library.sh - verify).
#
# Each Maven step aborts the script on failure so that a stale or missing jar
# is never uploaded after a broken build.

# Project root = parent directory of the directory containing this script.
# Quoted so that paths containing spaces survive word splitting.
root_path="$(dirname "$(cd "$(dirname "$0")" && pwd)")"
source "$root_path/bin/library.sh"

mvn -pl service-common,service-dependencies,service-configuration clean deploy -D skipTests -P local -s ~/.m2/settings-development.xml || exit 1
mvn -pl service-monitor clean package spring-boot:repackage -D skipTests -s ~/.m2/settings-development.xml || exit 1

upload "$root_path/service-monitor/target/service-monitor-1.0.0-SNAPSHOT.jar"

View File

@@ -26,6 +26,7 @@
<module>service-info-query</module>
<module>service-launcher</module>
<module>service-loki-query</module>
<module>service-monitor</module>
<module>service-pulsar-query</module>
<module>service-queue</module>
<module>service-scheduler</module>

View File

@@ -168,3 +168,9 @@ deploy:
- "service"
source-jar: service-exporter-1.0.0-SNAPSHOT.jar
replicas: 3
service-monitor:
order: 5
groups:
- "service"
source-jar: service-monitor-1.0.0-SNAPSHOT.jar
replicas: 1

View File

@@ -84,10 +84,12 @@ public interface Constants {
String DATA_TIME = "data-time";
String DATA_PARENT_PATH = "data-parent-path";
String METRICS_PREFIX = "metrics_hudi";
String METRICS_PREFIX = "service";
String METRICS_YARN_PREFIX = METRICS_PREFIX + "_yarn";
String METRICS_YARN_JOB = METRICS_YARN_PREFIX + "_job";
String METRICS_YARN_TABLE = METRICS_YARN_PREFIX + "_table";
String METRICS_SYNC_PREFIX = METRICS_PREFIX + "_sync";
String METRICS_SYNC_SOURCE_LATENCY = METRICS_SYNC_PREFIX + "_source_latency";
String METRICS_SYNC_LATENCY = METRICS_SYNC_PREFIX + "_latency";
@@ -100,6 +102,12 @@ public interface Constants {
String METRICS_SYNC_SOURCE_CHANGE_PARTITION = METRICS_SYNC_PREFIX + "_source_change_partition";
String METRICS_SYNC_SOURCE_BACK_LOGS = METRICS_SYNC_PREFIX + "_source_back_logs";
String METRICS_QUEUE_PREFIX = METRICS_PREFIX + "_queue";
String METRICS_QUEUE_SIZE = METRICS_QUEUE_PREFIX + "_size";
String METRICS_PULSAR_PREFIX = METRICS_PREFIX + "_pulsar";
String METRICS_PULSAR_BACKLOG = METRICS_PULSAR_PREFIX + "_backlog";
String METRICS_LABEL_FLINK_JOB_ID = "flink_job_id";
String METRICS_LABEL_FLINK_JOB_NAME = "flink_job_name";
String METRICS_LABEL_FLINK_NATIVE_JOB_ID = "flink_native_job_id";
@@ -124,6 +132,7 @@ public interface Constants {
String METRICS_STATUS_STOPPED = "stopped";
String METRICS_LABEL_TYPE = "type";
String METRICS_LABEL_NAME = "name";
String LOKI_PUSH_URL = "loki_push_url";

41
service-monitor/pom.xml Normal file
View File

@@ -0,0 +1,41 @@
<?xml version="1.0" encoding="UTF-8"?>
<!-- Maven descriptor of the service-monitor module. -->
<project xmlns="http://maven.apache.org/POM/4.0.0"
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
<modelVersion>4.0.0</modelVersion>
<!-- groupId and version are inherited from the hudi-service parent. -->
<parent>
<groupId>com.lanyuanxiaoyao</groupId>
<artifactId>hudi-service</artifactId>
<version>1.0.0-SNAPSHOT</version>
</parent>
<artifactId>service-monitor</artifactId>
<!-- No versions are declared below; presumably they are managed by the parent POM (verify). -->
<dependencies>
<dependency>
<groupId>com.lanyuanxiaoyao</groupId>
<artifactId>service-dependencies</artifactId>
</dependency>
<dependency>
<groupId>com.lanyuanxiaoyao</groupId>
<artifactId>service-configuration</artifactId>
</dependency>
<dependency>
<groupId>com.lanyuanxiaoyao</groupId>
<artifactId>service-forest</artifactId>
</dependency>
</dependencies>
<build>
<plugins>
<!-- Plugin configuration is not given here; presumably inherited from the parent's pluginManagement (verify). -->
<plugin>
<groupId>org.apache.maven.plugins</groupId>
<artifactId>maven-source-plugin</artifactId>
</plugin>
<plugin>
<groupId>org.springframework.boot</groupId>
<artifactId>spring-boot-maven-plugin</artifactId>
</plugin>
</plugins>
</build>
</project>

View File

@@ -0,0 +1,27 @@
package com.lanyuanxiaoyao.service.monitor;
import com.ulisesbocchio.jasyptspringboot.annotation.EnableEncryptableProperties;
import org.springframework.boot.SpringApplication;
import org.springframework.boot.autoconfigure.SpringBootApplication;
import org.springframework.boot.context.properties.EnableConfigurationProperties;
import org.springframework.cloud.client.discovery.EnableDiscoveryClient;
import org.springframework.retry.annotation.EnableRetry;
import org.springframework.scheduling.annotation.EnableScheduling;
/**
 * Spring Boot entry point of the monitor service.
 *
 * <p>Component scanning starts at {@code com.lanyuanxiaoyao.service}; service
 * discovery, configuration properties, encryptable properties, retry and
 * scheduling support are switched on through the annotations below.
 *
 * @author lanyuanxiaoyao
 * @date 2024-03-05
 */
@SpringBootApplication(scanBasePackages = "com.lanyuanxiaoyao.service")
@EnableDiscoveryClient
@EnableConfigurationProperties
@EnableEncryptableProperties
@EnableRetry
@EnableScheduling
public class MonitorApplication {
    /**
     * Boots the Spring application context.
     *
     * @param args command line arguments forwarded to Spring Boot
     */
    public static void main(String[] args) {
        SpringApplication application = new SpringApplication(MonitorApplication.class);
        application.run(args);
    }
}

View File

@@ -0,0 +1,9 @@
package com.lanyuanxiaoyao.service.monitor.metric;
/**
 * Common supertype for metric updaters; declares a single {@link #update()} hook.
 *
 * @author lanyuanxiaoyao
 * @date 2024-03-05
 */
public abstract class Metrics {
/**
 * Refreshes the metric values owned by the implementation.
 *
 * <p>The method is package-private, so implementations have to live in this package.
 */
abstract void update();
}

View File

@@ -0,0 +1,76 @@
package com.lanyuanxiaoyao.service.monitor.metric;
import cn.hutool.core.util.StrUtil;
import com.lanyuanxiaoyao.service.common.Constants;
import com.lanyuanxiaoyao.service.common.utils.NameHelper;
import com.lanyuanxiaoyao.service.configuration.ExecutorProvider;
import com.lanyuanxiaoyao.service.forest.service.InfoService;
import com.lanyuanxiaoyao.service.forest.service.PulsarService;
import io.micrometer.core.instrument.MeterRegistry;
import io.micrometer.core.instrument.Tag;
import java.util.Map;
import java.util.concurrent.atomic.AtomicLong;
import org.eclipse.collections.api.factory.Lists;
import org.eclipse.collections.api.factory.Maps;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.scheduling.annotation.Scheduled;
import org.springframework.stereotype.Service;
import static com.lanyuanxiaoyao.service.common.Constants.MINUTE;
/**
* Pulsar
*
* @author lanyuanxiaoyao
* @date 2024-03-05
*/
/**
 * Publishes the Pulsar subscription backlog of every table that has a Pulsar
 * address as a {@code Constants.METRICS_PULSAR_BACKLOG} gauge.
 *
 * <p>Each gauge reads its value from an {@link AtomicLong} holder. The registry
 * only keeps a weak reference to that holder, so the holders are cached in
 * {@link #backlogMap}: this keeps them reachable and guarantees that every
 * refresh writes into the same object the registered gauge is observing.
 */
@SuppressWarnings("SpringJavaInjectionPointsAutowiringInspection")
@Service
public class PulsarMetrics extends Metrics {
    private static final Logger logger = LoggerFactory.getLogger(PulsarMetrics.class);

    private final MeterRegistry registry;
    private final InfoService infoService;
    private final PulsarService pulsarService;
    /** Table alias -> value holder backing the gauge registered for that alias. */
    private final Map<String, AtomicLong> backlogMap;

    /**
     * @param registry      meter registry the backlog gauges are registered in
     * @param infoService   source of the table metadata list
     * @param pulsarService client used to resolve the Pulsar name and query the backlog
     */
    public PulsarMetrics(MeterRegistry registry, InfoService infoService, PulsarService pulsarService) {
        this.registry = registry;
        this.infoService = infoService;
        this.pulsarService = pulsarService;
        backlogMap = Maps.mutable.empty();
    }

    /**
     * Queries the current backlog of every table and stores it in the matching gauge.
     *
     * <p>A failure for one table is logged and does not stop the remaining tables.
     */
    @Scheduled(fixedDelay = MINUTE, initialDelay = MINUTE)
    @Override
    void update() {
        // Runs sequentially on purpose: backlogMap is not thread-safe. Switch it to a
        // concurrent map before parallelising this loop.
        infoService.tableMetaList()
            .reject(meta -> StrUtil.isBlank(meta.getPulsarAddress()))
            .forEach(meta -> {
                try {
                    String name = pulsarService.name(meta.getPulsarAddress());
                    Long backlog = pulsarService.backlog(name, meta.getTopic(), NameHelper.pulsarSubscriptionName(meta.getJob().getId(), meta.getAlias()));
                    if (backlog == null) {
                        logger.warn("No backlog returned for {}", meta.getAlias());
                        return;
                    }
                    // Register the gauge once per alias and reuse its holder afterwards.
                    // Re-registering on every run would hand back a fresh holder that the
                    // already-registered gauge never reads.
                    AtomicLong backlogCache = backlogMap.computeIfAbsent(
                        meta.getAlias(),
                        alias -> registry.gauge(
                            Constants.METRICS_PULSAR_BACKLOG,
                            Lists.immutable.of(
                                Tag.of(Constants.METRICS_LABEL_FLINK_JOB_ID, meta.getJob().getId().toString()),
                                Tag.of(Constants.METRICS_LABEL_ALIAS, meta.getAlias()),
                                Tag.of(Constants.METRICS_LABEL_SCHEMA, meta.getSchema()),
                                Tag.of(Constants.METRICS_LABEL_TABLE, meta.getTable())
                            ),
                            new AtomicLong()
                        )
                    );
                    backlogCache.set(backlog);
                } catch (Exception e) {
                    logger.warn("Something bad for {}", meta.getAlias(), e);
                }
            });
    }
}

View File

@@ -0,0 +1,5 @@
# Base configuration of the service-monitor application.
# spring.application.name sets the application name; spring.profiles.include
# lists extra profiles that are activated in addition to the active ones.
spring:
application:
name: service-monitor
profiles:
include: random-port,common,discovery,metrics,forest

View File

@@ -0,0 +1,52 @@
<!-- Logback configuration: logs go to Loki, the console and a rolling file. -->
<configuration>
<!-- Conversion words (%clr, %wex, %wEx) backed by Spring Boot's logback converters. -->
<conversionRule conversionWord="clr" converterClass="org.springframework.boot.logging.logback.ColorConverter" />
<conversionRule conversionWord="wex" converterClass="org.springframework.boot.logging.logback.WhitespaceThrowableProxyConverter" />
<conversionRule conversionWord="wEx" converterClass="org.springframework.boot.logging.logback.ExtendedWhitespaceThrowableProxyConverter" />
<!-- Values read from the Spring properties loki.url, logging.parent and spring.application.name. -->
<springProperty scope="context" name="LOKI_PUSH_URL" source="loki.url"/>
<springProperty scope="context" name="LOGGING_PARENT" source="logging.parent"/>
<springProperty scope="context" name="APP_NAME" source="spring.application.name"/>
<!-- Loki appender; falls back to http://localhost/loki/api/v1/push when LOKI_PUSH_URL is unset. -->
<appender name="Loki" class="com.github.loki4j.logback.Loki4jAppender">
<metricsEnabled>true</metricsEnabled>
<http class="com.github.loki4j.logback.ApacheHttpSender">
<url>${LOKI_PUSH_URL:-http://localhost/loki/api/v1/push}</url>
</http>
<format>
<!-- Stream labels: application name, host and log level. -->
<label>
<pattern>app=${APP_NAME:-none},host=${HOSTNAME:-none},level=%level</pattern>
<readMarkers>true</readMarkers>
</label>
<message>
<pattern>%d{yyyy-MM-dd HH:mm:ss.SSS} %p [${HOSTNAME}] [%t] %logger #@# %m%n%wEx</pattern>
</message>
<sortByTime>true</sortByTime>
</format>
</appender>
<!-- Console appender with colorized output. -->
<appender name="Console" class="ch.qos.logback.core.ConsoleAppender">
<encoder>
<pattern>%d{yyyy-MM-dd HH:mm:ss.SSS} %clr(%5p) %clr([${HOSTNAME}]){yellow} %clr([%t]){magenta} %clr(%logger{40}){cyan} #@# %m%n%wEx</pattern>
</encoder>
</appender>
<!-- File appender: writes ${APP_NAME}.log under LOGGING_PARENT (default: current directory) -->
<!-- and rolls into archive/ using a per-day date pattern with MaxHistory 7. -->
<appender name="RollingFile" class="ch.qos.logback.core.rolling.RollingFileAppender">
<file>${LOGGING_PARENT:-.}/${APP_NAME:-run}.log</file>
<rollingPolicy class="ch.qos.logback.core.rolling.TimeBasedRollingPolicy">
<fileNamePattern>${LOGGING_PARENT:-.}/archive/${APP_NAME:-run}-%d{yyyy-MM-dd}.gz</fileNamePattern>
<MaxHistory>7</MaxHistory>
</rollingPolicy>
<encoder>
<pattern>%d{yyyy-MM-dd HH:mm:ss.SSS} %p [${HOSTNAME}] [%t] %logger #@# %m%n%wEx</pattern>
</encoder>
</appender>
<!-- Raise the threshold for two loggers above the INFO root level. -->
<logger name="com.zaxxer.hikari" level="ERROR"/>
<logger name="com.netflix.discovery.shared.resolver.aws.ConfigClusterResolver" level="WARN"/>
<!-- Root logger at INFO, attached to all three appenders. -->
<root level="INFO">
<appender-ref ref="Loki"/>
<appender-ref ref="Console"/>
<appender-ref ref="RollingFile"/>
</root>
</configuration>

View File

@@ -1,5 +1,6 @@
package com.lanyuanxiaoyao.service.queue.controller;
import com.lanyuanxiaoyao.service.common.Constants;
import io.micrometer.core.instrument.MeterRegistry;
import io.micrometer.core.instrument.Tag;
import java.util.Collection;
@@ -17,10 +18,10 @@ public abstract class QueueOperator {
protected void updateMetrics(MeterRegistry registry, String name, Map<String, ? extends Collection<?>> map) {
map.forEach((queue, collection) -> registry.gaugeCollectionSize(
"service_queue_size",
Constants.METRICS_QUEUE_SIZE,
Lists.immutable.of(
Tag.of("type", name),
Tag.of("name", queue)
Tag.of(Constants.METRICS_LABEL_TYPE, name),
Tag.of(Constants.METRICS_LABEL_NAME, queue)
),
collection
));

View File

@@ -93,3 +93,6 @@ GET {{web-url}}/test
### 获取未运行的同步任务
GET {{exporter-url}}/exporter/un_running_flink_job
### Pulsar backlog
GET http://{{username}}:{{password}}@b12s15.hdp.dc:21685/pulsar/backlog?name=main&topic=persistent://odcp/grid/grid_serv_staff&subscription=Hudi_Sync_Pulsar_Reader_1552408245762723840_grid_grid_serv_staff_b_20230425

View File

@@ -0,0 +1,106 @@
package com.lanyuanxiaoyao.service.sync;
import com.fasterxml.jackson.core.JsonProcessingException;
import com.fasterxml.jackson.databind.ObjectMapper;
import com.lanyuanxiaoyao.service.common.entity.Record;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
 * Manual check that a sample change message can be deserialized into {@link Record}.
 *
 * <p>Run {@link #main(String[])} directly; the parsed record is written to the log.
 *
 * @author lanyuanxiaoyao
 * @date 2024-03-04
 */
public class MessageParseTest {
private static final Logger logger = LoggerFactory.getLogger(MessageParseTest.class);
/**
 * Parses the embedded sample message with Jackson and logs the result.
 *
 * @param args unused
 * @throws JsonProcessingException if the sample message cannot be mapped to {@link Record}
 */
public static void main(String[] args) throws JsonProcessingException {
// Sample message: an update ("opType": "U") on acct_sz.acct_item with a "before" and
// an "after" row image; CUSTOM_ITEM differs between the two images.
// language=JSON
String message = "{\n" +
" \"source\": {\n" +
" \"sourceId\": \"set_4846458104\",\n" +
" \"sourceType\": null,\n" +
" \"sourcePos\": \"mysql-bin.013514:245945070\",\n" +
" \"currentTs\": \"2024-03-02 06:29:04\"\n" +
" },\n" +
" \"statement\": {\n" +
" \"schema\": \"acct_sz\",\n" +
" \"table\": \"acct_item\",\n" +
" \"opStatement\": null,\n" +
" \"opType\": \"U\",\n" +
" \"op\": null,\n" +
" \"opTs\": \"2024-03-02 06:29:04\",\n" +
" \"before\": {\n" +
" \"REGION_ID\": \"940271349\",\n" +
" \"CUST_ID\": \"0\",\n" +
" \"AMOUNT_FIX\": \"-2224\",\n" +
" \"ONE_ACCT_ITEM_ID\": \"0\",\n" +
" \"BILL_ID\": \"0\",\n" +
" \"PARTY_ROLE_ID\": \"100\",\n" +
" \"AMOUNT\": \"-2224\",\n" +
" \"ITEM_SOURCE_ID\": \"30145122\",\n" +
" \"HAD_INVOICE_AMOUNT\": \"0\",\n" +
" \"DUE_DATE\": \"2024-04-06\",\n" +
" \"ACCT_ID\": \"310000038469672\",\n" +
" \"DUE_TYPE\": \"0\",\n" +
" \"FEE_CYCLE_ID\": \"20240201\",\n" +
" \"ARREAR_DATE\": \"2024-04-06\",\n" +
" \"PROD_INST_ID\": \"420002870683658\",\n" +
" \"PAYMENT_METHOD\": \"0\",\n" +
" \"STATUS_DATE\": \"2024-03-01 09:42:21\",\n" +
" \"PAY_CYCLE_ID\": \"20240301\",\n" +
" \"NO_INVOICE_AMOUNT\": \"0\",\n" +
" \"ACC_NUM\": \"13302956536\",\n" +
" \"PRESENT_AMOUNT\": \"0\",\n" +
" \"GROUP_ID\": \"270002513937230\",\n" +
" \"CREATE_DATE\": \"2024-03-01 09:42:21\",\n" +
" \"CITY_ID\": \"755\",\n" +
" \"ACCT_ITEM_TYPE_ID\": \"16150\",\n" +
" \"PAY_START_DATE\": \"2024-03-03\",\n" +
" \"ACCT_ITEM_ID\": \"27000036749650554\",\n" +
" \"BILLING_CYCLE_ID\": \"20240201\",\n" +
" \"OFFER_INST_ID\": \"420001788058165\",\n" +
" \"STATUS_CD\": \"1\",\n" +
" \"ORI_ACCT_ITEM_ID\": \"0\",\n" +
" \"CUSTOM_ITEM\": \"0000000000000000\"\n" +
" },\n" +
" \"after\": {\n" +
" \"REGION_ID\": \"940271349\",\n" +
" \"CUST_ID\": \"0\",\n" +
" \"AMOUNT_FIX\": \"-2224\",\n" +
" \"ONE_ACCT_ITEM_ID\": \"0\",\n" +
" \"BILL_ID\": \"0\",\n" +
" \"PARTY_ROLE_ID\": \"100\",\n" +
" \"AMOUNT\": \"-2224\",\n" +
" \"ITEM_SOURCE_ID\": \"30145122\",\n" +
" \"HAD_INVOICE_AMOUNT\": \"0\",\n" +
" \"DUE_DATE\": \"2024-04-06\",\n" +
" \"ACCT_ID\": \"310000038469672\",\n" +
" \"DUE_TYPE\": \"0\",\n" +
" \"FEE_CYCLE_ID\": \"20240201\",\n" +
" \"ARREAR_DATE\": \"2024-04-06\",\n" +
" \"PROD_INST_ID\": \"420002870683658\",\n" +
" \"PAYMENT_METHOD\": \"0\",\n" +
" \"STATUS_DATE\": \"2024-03-01 09:42:21\",\n" +
" \"PAY_CYCLE_ID\": \"20240301\",\n" +
" \"NO_INVOICE_AMOUNT\": \"0\",\n" +
" \"ACC_NUM\": \"13302956536\",\n" +
" \"PRESENT_AMOUNT\": \"0\",\n" +
" \"GROUP_ID\": \"270002513937230\",\n" +
" \"CREATE_DATE\": \"2024-03-01 09:42:21\",\n" +
" \"CITY_ID\": \"755\",\n" +
" \"ACCT_ITEM_TYPE_ID\": \"16150\",\n" +
" \"PAY_START_DATE\": \"2024-03-03\",\n" +
" \"ACCT_ITEM_ID\": \"27000036749650554\",\n" +
" \"BILLING_CYCLE_ID\": \"20240201\",\n" +
" \"OFFER_INST_ID\": \"420001788058165\",\n" +
" \"STATUS_CD\": \"1\",\n" +
" \"ORI_ACCT_ITEM_ID\": \"0\",\n" +
" \"CUSTOM_ITEM\": \"1000000000000000\"\n" +
" }\n" +
" }\n" +
"}";
// Default ObjectMapper configuration; readValue throws if the JSON cannot be mapped.
ObjectMapper mapper = new ObjectMapper();
Record record = mapper.readValue(message, Record.class);
logger.info("Record: {}", record);
}
}