docs: 补充文档

This commit is contained in:
v-zhangjc9
2024-03-22 15:55:05 +08:00
parent 03bb3243bc
commit c4e4b8b3f1

View File

@@ -824,72 +824,109 @@ dws_acct_item_gz
```plantuml
@startuml
skinparam Dpi 500
title 系统架构图
rectangle 外部应用服务 as app
entity 外部应用 as external_apps
rectangle Hudi服务 {
rectangle Hudi运行模块 as application
rectangle Hudi运维服务 as service
service -left-> application:启停、运维
cloud Hadoop集群 as hadoop {
rectangle Hudi同步任务 as hudi_task
}
application -up-> app:数据提供
rectangle Hudi服务群 as hudi_services
rectangle 汇聚平台 {
queue 消息队列 as queue
}
rectangle 汇聚平台 as odcp
queue -up-> application:数据提供
@enduml
entity 业务平台 as datasource
datasource -> odcp:数据采集
odcp -right-> hudi_task:数据加工/推送
hudi_services -u.> hudi_task:Hudi同步任务提交
hudi_task -> external_apps:提供数据
```
```plantuml
@startuml
'hide circle
title 功能架构图
'rectangle 业务应用 as source {
' database 业务数据源
'}
'rectangle 汇聚平台 as odcp {
' rectangle 数据采集 as o1
' rectangle 数据转换 as o2
' rectangle 数据加工 as o3
' rectangle 数据管理 as o4
'
' o1 .[hidden] o2
' o2 .[hidden] o3
' o3 .[hidden] o4
'}
@enduml
```
```plantuml
@startuml
'skinparam Linetype ortho
skinparam Dpi 500
title 技术架构图
rectangle Yarn集群 as yarn {
cloud Yarn集群 as yarn {
rectangle Hudi同步压缩任务 as sc
rectangle "..." as other
sc .[hidden] other
}
cloud Yarn集群 as yarn2
database HDFS as hdfs
database HDFS as hdfs2
database Zookeeper as zk
rectangle 汇聚平台 {
database "配置库(MySQL)" as db
queue "消息队列(Pulsar集群)" as pulsar
database "MySQL" as db
queue "Pulsar集群" as pulsar
db -up[hidden]- pulsar
db -u[hidden]- pulsar
}
rectangle "Hudi服务Spring Boot" as service {
rectangle "Hudi服务" as service {
rectangle 调度服务 as schedule
rectangle 查询服务 as query
rectangle "查询服务" as query
rectangle web控制台 as web
web --> query:查询
schedule <--> query:查询
schedule <--> query:调度详情
}
schedule -up-> yarn:"提交Hudi同步/压缩任务"
pulsar -up-> sc:数据提供
sc --> hdfs
hdfs --> Flink
hdfs --> Spark
hdfs --> Hive
rectangle 外部应用 as app {
rectangle Flink as flink
rectangle Spark as spark
rectangle Hive as hive
pulsar -> query:元数据查询admin
flink .[hidden] spark
spark .[hidden] hive
}
schedule -u-> yarn:"提交Hudi同步/压缩任务"
pulsar -u-> sc:数据提供
sc -l-> hdfs:数据输出
hdfs <-u- flink:查询
hdfs <-u- spark:查询
hdfs <-u- hive:查询
pulsar -> query:元数据查询
query <- db: 配置信息
query <- zk: 配置信息
query <-- hdfs2: Hudi信息
query <-- zk: 锁信息
query <-- yarn2: 集群信息
@enduml
```