这里使用 Flume 只需要创建一个新的 Flume 配置文件即可。我将配置文件命名为 access_hdfs.properties，下面是配置文件的内容：
#-----------------access_hdfs.properties---------------#
#--------------------Edit by Cheengvho-----------------#
# ---- Components of agent "agent1": one source, one channel, one sink ----
agent1.sources = src1
agent1.channels = ch1
agent1.sinks = sink1

# ---- Source src1: spooling-directory source ----
# Reads from /var/log/flume and hands its events to channel ch1.
agent1.sources.src1.type = spooldir
agent1.sources.src1.spoolDir = /var/log/flume
agent1.sources.src1.channels = ch1

# ---- Interceptor i1 on src1: regex_extractor ----
# The regex captures a leading "yyyy-MM-dd HH:mm" date-time (optionally
# preceded by a newline). Backslashes are doubled because the properties
# format treats a single backslash as an escape character.
agent1.sources.src1.interceptors = i1
agent1.sources.src1.interceptors.i1.type = regex_extractor
agent1.sources.src1.interceptors.i1.regex = ^(?:\\n)?(\\d\\d\\d\\d-\\d\\d-\\d\\d\\s\\d\\d:\\d\\d)
# Serializer s1 parses the captured group with the date pattern below and
# stores the result under the name "timestamp" (the millis serializer
# converts it to epoch milliseconds, per the Flume User Guide).
agent1.sources.src1.interceptors.i1.serializers = s1
agent1.sources.src1.interceptors.i1.serializers.s1.type = org.apache.flume.interceptor.RegexExtractorInterceptorMillisSerializer
agent1.sources.src1.interceptors.i1.serializers.s1.name = timestamp
agent1.sources.src1.interceptors.i1.serializers.s1.pattern = yyyy-MM-dd HH:mm

# ---- Sink sink1: HDFS sink writing under /flume/ ----
# NOTE(review): the type of channel ch1 and the sink1 -> ch1 binding are not
# set in the lines shown here; confirm they are defined elsewhere in the file.
agent1.sinks.sink1.type = hdfs
agent1.sinks.sink1.hdfs.path = /flume/