ods_usr_traces_apd_d.sql 4.1 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647
  1. -- 作者:tianyu.chu
  2. -- 日期:2026-06-10
  3. -- 工单:(无)
  4. -- 目的:埋点 raw → ods,解析脱敏后 _source JSON 拍平公共属性 + 保留 params_json;按事件日 dt 静态分区写入
  5. -- 状态:[待执行]
  6. -- 备注:ES 按事件日分索引,raw.dt = 事件日,故 dt 静态写 ${dt}(不用动态分区,避开动态覆盖风险);
  7. -- 事件不可变,无双源 union / 无 update_time 去重;es_id 单文件内唯一;时区随集群(东八区)
  8. INSERT OVERWRITE TABLE ods.ods_usr_traces_apd_d PARTITION (dt = '${dt}')
  9. SELECT
  10. es_id AS es_id,
  11. event_name AS event_name,
  12. get_json_object(raw_json, '$.type') AS evt_type,
  13. CAST(CAST(get_json_object(raw_json, '$.time') AS BIGINT) / 1000 AS TIMESTAMP) AS event_time,
  14. CAST(CAST(get_json_object(raw_json, '$.flushTime') AS BIGINT) / 1000 AS TIMESTAMP) AS flush_time,
  15. get_json_object(raw_json, '$.loginId') AS login_id,
  16. get_json_object(raw_json, '$.distinctId') AS distinct_id,
  17. get_json_object(raw_json, '$.anonymousId') AS anonymous_id,
  18. get_json_object(raw_json, '$.properties.userId') AS user_id,
  19. get_json_object(raw_json, '$.properties.userName') AS user_name,
  20. get_json_object(raw_json, '$.properties.userLevel') AS user_lvl,
  21. get_json_object(raw_json, '$.lib.lib') AS lib,
  22. get_json_object(raw_json, '$.lib.libVersion') AS lib_version,
  23. get_json_object(raw_json, '$.lib.libMethod') AS lib_method,
  24. get_json_object(raw_json, '$.properties.appId') AS app_id,
  25. get_json_object(raw_json, '$.properties.appName') AS app_name,
  26. get_json_object(raw_json, '$.properties.appVersion') AS app_version,
  27. get_json_object(raw_json, '$.properties.wgtVersion') AS wgt_version,
  28. get_json_object(raw_json, '$.properties.os') AS os,
  29. get_json_object(raw_json, '$.properties.osVersion') AS os_version,
  30. get_json_object(raw_json, '$.properties.manufacturer') AS manufacturer,
  31. get_json_object(raw_json, '$.properties.brand') AS brand,
  32. get_json_object(raw_json, '$.properties.model') AS model,
  33. get_json_object(raw_json, '$.properties.deviceId') AS device_id,
  34. get_json_object(raw_json, '$.properties.networkType') AS network_type,
  35. get_json_object(raw_json, '$.properties.carrier') AS carrier,
  36. CAST(get_json_object(raw_json, '$.properties.wifi') AS BOOLEAN) AS wifi,
  37. CAST(get_json_object(raw_json, '$.properties.screenWidth') AS BIGINT) AS screen_width,
  38. CAST(get_json_object(raw_json, '$.properties.screenHeight') AS BIGINT) AS screen_height,
  39. CAST(get_json_object(raw_json, '$.properties.timezoneOffset') AS BIGINT) AS timezone_offset,
  40. CAST(get_json_object(raw_json, '$.properties.isFirstDay') AS BOOLEAN) AS is_first_day,
  41. CAST(get_json_object(raw_json, '$.properties.isFirstTime') AS BOOLEAN) AS is_first_time,
  42. CAST(get_json_object(raw_json, '$.properties.resumeFromBackground') AS BOOLEAN) AS resume_from_background,
  43. CAST(get_json_object(raw_json, '$.properties.eventDuration') AS BIGINT) AS event_duration,
  44. get_json_object(raw_json, '$.properties.params') AS params_json
  45. FROM raw.raw_usr_traces_apd_d
  46. WHERE dt = '${dt}';