實時監控目錄下多個新檔案

# Flume agent "a3": watches a spooling directory for new files and ships
# their contents to HDFS through an in-memory channel.
#
# NOTE: Flume reads this file with java.util.Properties. Property names are
# case-sensitive, each property must be on its own line, and comments must
# be on their own line (there is no inline-comment syntax).

# Name the components of this agent
a3.sources = r3
a3.sinks = k3
a3.channels = c3

# Describe/configure the source
a3.sources.r3.type = spooldir
# Directory to watch for newly dropped files
a3.sources.r3.spoolDir = /opt/module/flume-1.7.0/upload
# Suffix appended to a file once it has been fully ingested
a3.sources.r3.fileSuffix = .completed
# Add a header to each event carrying the absolute path of its source file
a3.sources.r3.fileHeader = true
# Ignore (do not upload) every file whose name ends in .tmp.
# The backslash is doubled because java.util.Properties consumes one level
# of backslash escaping; the regex that reaches Flume is ([^ ]*\.tmp)
a3.sources.r3.ignorePattern = ([^ ]*\\.tmp)

# Describe the sink
a3.sinks.k3.type = hdfs
# Target directory; %Y%m%d = four-digit year, month, day; %H = hour (00..23)
a3.sinks.k3.hdfs.path = hdfs://hadoop102:9000/flume/upload/%Y%m%d/%H
# Prefix for the names of uploaded files
a3.sinks.k3.hdfs.filePrefix = upload-
# Round the event timestamp down, so directories roll over by time
a3.sinks.k3.hdfs.round = true
# Number of time units after which a new directory is created
a3.sinks.k3.hdfs.roundValue = 1
# Time unit used for rounding
a3.sinks.k3.hdfs.roundUnit = hour
# Use the local time instead of a timestamp header on the event
a3.sinks.k3.hdfs.useLocalTimeStamp = true
# Number of events accumulated before flushing to HDFS
a3.sinks.k3.hdfs.batchSize = 100
# Output file type; DataStream writes uncompressed data
# (CompressedStream enables compression)
a3.sinks.k3.hdfs.fileType = DataStream
# Seconds before rolling to a new file
a3.sinks.k3.hdfs.rollInterval = 60
# Roll the file when it reaches this size in bytes (roughly 128 MB)
a3.sinks.k3.hdfs.rollSize = 134217700
# 0 = never roll based on the number of events
a3.sinks.k3.hdfs.rollCount = 0

# Use a channel which buffers events in memory
a3.channels.c3.type = memory
a3.channels.c3.capacity = 1000
a3.channels.c3.transactionCapacity = 100

# Bind the source and sink to the channel
a3.sources.r3.channels = c3
a3.sinks.k3.channel = c3

實時監控目錄下多個新檔案

Flume 1.9.0 實時監控目錄下多個新檔案

python之查詢指定目錄下的最新檔案

監控目錄下的檔案操作與實時同步

實時監控目錄下多個新檔案

Flume 1.9.0 實時監控目錄下多個新檔案

python之查詢指定目錄下的最新檔案

監控目錄下的檔案操作與實時同步

相關推薦