1. 程式人生 > >flume hdfs檔案輸出普通文字 正確行數

flume hdfs檔案輸出普通文字 正確行數

本次除錯flume讀取kafka資料輸出至hdfs總是內容不對,使用fs -cat檢視行數不對,經過測試後發現需要如下配置:

agent.sources = midlog
agent.channels = hdfsChannel
agent.sinks = hdfsSink

# the source of hdfs
agent.sources.midlog.type = org.apache.flume.source.kafka.KafkaSource
agent.sources.midlog.channels = hdfsChannel
agent.sources.midlog.batchSize = 5000
agent.sources.midlog.batchDurationMillis = 2000
agent.sources.midlog.kafka.bootstrap.servers = master.server.com:9092
agent.sources.midlog.kafka.topics = mid_analog
agent.sources.midlog.kafka.consumer.group.id = custom.g.id

# the channel of hdfs
agent.channels.hdfsChannel.type = file
agent.channels.hdfsChannel.checkpointDir = /data/flume/checkpointDir
agent.channels.hdfsChannel.dataDirs = /data/flume/dataDirs

# the sink of hdfs
agent.sinks.hdfsSink.type = hdfs
agent.sinks.hdfsSink.channel = hdfsChannel

agent.sinks.hdfsSink.hdfs.path = /flumelogs/midlog
agent.sinks.hdfsSink.hdfs.fileType = DataStream

agent.sinks.hdfsSink.hdfs.filePrefix = src
agent.sinks.hdfsSink.hdfs.round = true
agent.sinks.hdfsSink.hdfs.roundValue = 10
agent.sinks.hdfsSink.hdfs.roundUnit = minute

agent.sinks.hdfsSink.hdfs.rollInterval = 0
agent.sinks.hdfsSink.hdfs.rollSize = 0
agent.sinks.hdfsSink.hdfs.rollCount = 1000