docs: 补充文档

This commit is contained in:
v-zhangjc9
2024-03-22 15:55:05 +08:00
parent 03bb3243bc
commit c4e4b8b3f1

View File

@@ -824,72 +824,109 @@ dws_acct_item_gz
```plantuml ```plantuml
@startuml @startuml
skinparam Dpi 500
title 系统架构图 title 系统架构图
rectangle 外部应用服务 as app entity 外部应用 as external_apps
rectangle Hudi服务 { cloud Hadoop集群 as hadoop {
rectangle Hudi运行模块 as application rectangle Hudi同步任务 as hudi_task
rectangle Hudi运维服务 as service
service -left-> application:启停、运维
} }
application -up-> app:数据提供 rectangle Hudi服务群 as hudi_services
rectangle 汇聚平台 { rectangle 汇聚平台 as odcp
queue 消息队列 as queue
}
queue -up-> application:数据提供 entity 业务平台 as datasource
@enduml
datasource -> odcp:数据采集
odcp -right-> hudi_task:数据加工/推送
hudi_services -u.> hudi_task:Hudi同步任务提交
hudi_task -> external_apps:提供数据
``` ```
```plantuml ```plantuml
@startuml @startuml
'hide circle
title 功能架构图 title 功能架构图
'rectangle 业务应用 as source {
' database 业务数据源
'}
'rectangle 汇聚平台 as odcp {
' rectangle 数据采集 as o1
' rectangle 数据转换 as o2
' rectangle 数据加工 as o3
' rectangle 数据管理 as o4
'
' o1 .[hidden] o2
' o2 .[hidden] o3
' o3 .[hidden] o4
'}
@enduml @enduml
``` ```
```plantuml ```plantuml
@startuml @startuml
'skinparam Linetype ortho
skinparam Dpi 500
title 技术架构图 title 技术架构图
rectangle Yarn集群 as yarn { cloud Yarn集群 as yarn {
rectangle Hudi同步压缩任务 as sc rectangle Hudi同步压缩任务 as sc
rectangle "..." as other
sc .[hidden] other
} }
cloud Yarn集群 as yarn2
database HDFS as hdfs database HDFS as hdfs
database HDFS as hdfs2
database Zookeeper as zk database Zookeeper as zk
rectangle 汇聚平台 { rectangle 汇聚平台 {
database "配置库(MySQL" as db database "MySQL" as db
queue "消息队列(Pulsar集群" as pulsar queue "Pulsar集群" as pulsar
db -up[hidden]- pulsar db -u[hidden]- pulsar
} }
rectangle "Hudi服务Spring Boot" as service { rectangle "Hudi服务" as service {
rectangle 调度服务 as schedule rectangle 调度服务 as schedule
rectangle 查询服务 as query rectangle "查询服务" as query
rectangle web控制台 as web rectangle web控制台 as web
web --> query:查询 web --> query:查询
schedule <--> query:查询 schedule <--> query:调度详情
} }
schedule -up-> yarn:"提交Hudi同步/压缩任务" rectangle 外部应用 as app {
pulsar -up-> sc:数据提供 rectangle Flink as flink
sc --> hdfs rectangle Spark as spark
hdfs --> Flink rectangle Hive as hive
hdfs --> Spark
hdfs --> Hive
pulsar -> query:元数据查询admin flink .[hidden] spark
spark .[hidden] hive
}
schedule -u-> yarn:"提交Hudi同步/压缩任务"
pulsar -u-> sc:数据提供
sc -l-> hdfs:数据输出
hdfs <-u- flink:查询
hdfs <-u- spark:查询
hdfs <-u- hive:查询
pulsar -> query:元数据查询
query <- db: 配置信息 query <- db: 配置信息
query <- zk: 配置信息 query <-- hdfs2: Hudi信息
query <-- zk: 锁信息
query <-- yarn2: 集群信息
@enduml @enduml
``` ```