实时数据仓库之客户行为分析
项目背景:
前端收集客户从各个渠道下载、注册、登录、操作菜单、浏览页面等信息,统一发送到日志数据收集服务器,再由日志收集服务器统一转发到大数据平台做客户行为分析。
项目目标:
实现与设计:
采集日志格式:
-- -------------------------
-- ODS layer: raw log records
-- Kafka source table
--
-- Every field is declared as VARCHAR, in the order listed below, and is
-- decoded from JSON messages on the 'hxd_log' topic.
-- NOTE(review): the column names are abbreviated log keys whose meanings
-- are not documented in this file -- confirm against the log format spec.
-- -------------------------
CREATE TABLE ods_hxd_log (
    sdate VARCHAR,
    cdate VARCHAR,
    ky    VARCHAR,
    id    VARCHAR,
    ch    VARCHAR,
    av    VARCHAR,
    sv    VARCHAR,
    ui    VARCHAR,
    mc    VARCHAR,
    im    VARCHAR,
    ut    VARCHAR,
    qq    VARCHAR,
    mf    VARCHAR,
    md    VARCHAR,
    sd    VARCHAR,
    ip    VARCHAR,
    op    VARCHAR,
    tn    VARCHAR,
    cn    VARCHAR,
    ov    VARCHAR,
    lg    VARCHAR,
    sr    VARCHAR,
    tz    VARCHAR,
    jb    VARCHAR,
    si    VARCHAR,
    ts    VARCHAR,
    pi    VARCHAR,
    rf    VARCHAR,
    et    VARCHAR,
    tags  VARCHAR,
    ei    VARCHAR,
    ar    VARCHAR,
    kv    VARCHAR,
    du    VARCHAR,
    er    VARCHAR,
    ea    VARCHAR,
    ext1  VARCHAR,
    ext2  VARCHAR,
    ext3  VARCHAR,
    ext4  VARCHAR,
    ext5  VARCHAR,
    ext6  VARCHAR,
    ext7  VARCHAR,
    ext8  VARCHAR,
    ext9  VARCHAR,
    ext10 VARCHAR,
    ext11 VARCHAR,
    ext12 VARCHAR,
    ext13 VARCHAR,
    ext14 VARCHAR,
    ext15 VARCHAR,
    fm    VARCHAR,
    di    VARCHAR,
    uid   VARCHAR,
    ec    VARCHAR
) WITH (
    'connector.type' = 'kafka',
    'connector.version' = '0.11',
    'connector.topic' = 'hxd_log',
    -- Start consuming from the earliest offset of the topic.
    'connector.startup-mode' = 'earliest-offset',
    -- Alternative: explicit per-partition start offsets.
    -- NOTE(review): presumably also requires switching the startup mode
    -- to 'specific-offsets' -- confirm before enabling.
    --'connector.specific-offsets' = 'partition:0,offset:0;partition:1,offset:0;partition:2,offset:0',
    'connector.properties.group.id' = 'hxd_log_group1',
    'connector.properties.zookeeper.connect' = 's1:2181,s2:2181,s3:2181',
    -- Must be a single well-formed string literal holding the comma-separated
    -- broker list.
    'connector.properties.bootstrap.servers' = 'm1:9092,m2:9092,s1:9092',
    'format.type' = 'json'
);