dolphinscheduler实时数据同步
通过seatunnel实时从MySQL同步数据到另一个MySQL库
前提是来源库必须开启 binlog（MySQL-CDC 要求 binlog_format 为 ROW）
下面是seatunnel的配置代码
# Job-level settings applied to the whole SeaTunnel job.
env {
  # Run continuously as a streaming job (needed for CDC) instead of a one-off batch.
  job.mode = "STREAMING"

  # Job-wide parallelism; the MySQL-CDC source sets its own value separately.
  parallelism = 2

  # NOTE(review): confirm that `timezone` is an env option recognised by the
  # SeaTunnel version in use; the JDBC URLs already carry serverTimezone.
  timezone = "Asia/Shanghai"

  # Failover retry policy.
  # NOTE(review): presumably the interval is in milliseconds (10 s) — confirm
  # that these keys are honoured by the engine this job is submitted to.
  job.failover.retry_times = 5
  job.failover.retry_interval = 10000
}
# Change-data-capture source: reads changes of table ny_syld.aaa from MySQL.
source {
  MySQL-CDC {
    # Name under which this source's output is registered; the sink picks it
    # up through its source_table_name setting.
    result_table_name = "fake"
    parallelism = 1

    # Connection to the source MySQL instance.
    # NOTE(review): credentials are stored in plain text — consider supplying
    # them from outside this file.
    base-url = "jdbc:mysql://192.168.1.6:3306/ny_syld?serverTimezone=Asia/Shanghai&useSSL=false"
    username = "root_DB"
    password = "mysql.7334453"
    # NOTE(review): the port is already part of base-url; confirm that a
    # separate `port` key is actually read by the MySQL-CDC connector.
    port = 3306

    # ID this client presents to MySQL when reading the binlog.
    # NOTE(review): presumably must not clash with any other replication
    # client or server ID on the same MySQL cluster — verify.
    server-id = 58911

    # Tables to capture, written as "<database>.<table>".
    table-names = ["ny_syld.aaa"]
  }
}
# JDBC sink: writes the captured changes into ny_syld.aaa_new.
sink {
  jdbc {
    # Consume the dataset registered by the source as "fake".
    source_table_name = "fake"

    # Connection to the target MySQL instance.
    # NOTE(review): credentials are stored in plain text — consider supplying
    # them from outside this file.
    url = "jdbc:mysql://192.168.1.6:3306/ny_syld?serverTimezone=Asia/Shanghai&useSSL=false"
    driver = "com.mysql.cj.jdbc.Driver"
    user = "root_DB"
    password = "mysql.7334453"

    # Target table. With generate_sink_sql enabled the connector builds the
    # write statements itself from database/table, using primary_keys to
    # identify rows.
    database = "ny_syld"
    table = "aaa_new"
    primary_keys = ["id"]
    generate_sink_sql = true

    # NOTE(review): `save_mode` does not appear in the 2.3.3 Jdbc sink option
    # list — confirm it has any effect on the version in use.
    save_mode = "UPSERT"

    # Batching: a batch size of 1 means every record is flushed on its own.
    batch_size = 1
    # NOTE(review): the 2.3.3 Jdbc sink documents `batch_interval_ms`, not
    # `batch_interval` — confirm this key is honoured.
    batch_interval = 1000

    # Retry policy for failed writes.
    max_retries = 3
    # NOTE(review): `retry_interval` is not among the documented 2.3.3 Jdbc
    # sink options — confirm it is honoured (presumably milliseconds).
    retry_interval = 5000
  }
}
要实现实时同步需要MySQL-CDC
配置文档
https://seatunnel.apache.org/docs/2.3.3/connector-v2/source/MySQL-CDC
需要注意的是，MySQL 的 JDBC 驱动（MySQL Connector/J）需要升级到 8.0.28 以上

lib 目录下放置的驱动 jar 包不要与其他目录中的驱动重复。



