| 123456789101112131415161718192021222324252627282930 |
- ; DataX 同步配置:PG public.app_user_cert_info → Hive test.raw_usr_app_user_cert_info_inc_d
- ;
- ; 源 datasource:datasource/postgresql/dev-poyee-xiaoxu.ini
- ; 目标 datasource:datasource/hdfs/prd-hdfs-ha.ini(HA 集群,nameservice1)
- ; 时间锚点:create_time
- ; 敏感字段 user_cert_data / cert_no / cert_real_name 不查(column 不列)
- ; cert_birthday 原样同步未脱敏,正式 raw 上线前补脱敏方案(kb/90 §2.6 后延高优先级)
- ;
- ; 注:key = value 不对齐——parse_ddl 的 grep "path =" 要求字面子串,多空格对齐会破匹配
- [reader]
- ; Source side of the sync: reads the PostgreSQL table public.app_user_cert_info.
- ; The file header names datasource/postgresql/dev-poyee-xiaoxu.ini as the source datasource definition.
- dataSource = postgresql/dev-poyee-xiaoxu
- database = hs_sync_data
- table = public.app_user_cert_info
- ; Sensitive fields user_cert_data, cert_no and cert_real_name are deliberately not listed, so they are never queried.
- ; cert_birthday is read as-is, without masking (see the file header for the pending masking plan).
- column = id,user_id,cert_birthday,cert_sex,cert_province,cert_city,version,status,del_flag,create_time,update_time
- ; Left empty on the reader side. NOTE(review): presumably the reader needs no explicit types - confirm.
- columnType =
- ; Half-open window on create_time: start_date is inclusive, stop_date is exclusive.
- ; NOTE(review): the start_date / stop_date placeholders are presumably filled in by the job launcher - confirm.
- where = create_time >= '${start_date}' AND create_time < '${stop_date}'
- ; NOTE(review): presumably forwarded to DataX as the split key for parallel reads - confirm.
- splitPk = id
- ; NOTE(review): presumably the JDBC fetch batch size in rows - confirm.
- fetchSize = 1000
- [writer]
- ; Target side of the sync: files land in the warehouse directory of the Hive table test.raw_usr_app_user_cert_info_inc_d.
- ; The file header names datasource/hdfs/prd-hdfs-ha.ini (HA cluster, nameservice1) as the target datasource definition.
- dataSource = hdfs/prd-hdfs-ha
- ; One output directory per dt partition value.
- ; Keep exactly one space on each side of the equals sign on the next line: per the file header,
- ; parse_ddl greps for that literal substring and extra alignment spaces break the match.
- path = /user/hive/warehouse/test.db/raw_usr_app_user_cert_info_inc_d/dt=${dt}/
- ; Same eleven columns, in the same order, as the reader's column list.
- column = id,user_id,cert_birthday,cert_sex,cert_province,cert_city,version,status,del_flag,create_time,update_time
- ; Every column is declared as STRING.
- columnType = id:STRING,user_id:STRING,cert_birthday:STRING,cert_sex:STRING,cert_province:STRING,cert_city:STRING,version:STRING,status:STRING,del_flag:STRING,create_time:STRING,update_time:STRING
- fileType = orc
- fileName = raw_usr_app_user_cert_info_inc_d
- encoding = UTF-8
- ; NOTE(review): presumably clears existing output in the target directory before writing, so a rerun
- ; for the same dt replaces earlier files - confirm against the hdfswriter documentation.
- writeMode = truncate
- ; NOTE(review): a field delimiter is likely irrelevant for ORC output but may still be required by hdfswriter - confirm.
- ; Whether the backslash-t below is unescaped to a real tab depends on the loader - confirm.
- fieldDelimiter = \t
|