image.png

    1. vim job/flume-dir-hdfs.conf
    2. a3.sources = r3
    3. a3.sinks = k3
    4. a3.channels = c3
    5. # Describe/configure the source
    6. #source类型
    7. a3.sources.r3.type = spooldir
    8. #监控的路径
    9. a3.sources.r3.spoolDir = /opt/egg/apache-flume-1.7.0-bin/upload
    10. #文件被Flume完整采集后,给源文件追加的后缀(标记该文件已处理,避免重复采集)
    11. a3.sources.r3.fileSuffix = .COMPLETED
    12. #是否在Event的header中添加源文件的绝对路径
    13. a3.sources.r3.fileHeader = true
    14. #忽略所有以.tmp结尾的文件,不上传
    15. a3.sources.r3.ignorePattern = ([^ ]*\.tmp)
    16. # Describe the sink
    17. a3.sinks.k3.type = hdfs
    18. a3.sinks.k3.hdfs.path = hdfs://hadoop1:9000/flume/upload/%Y%m%d/%H
    19. #上传文件的前缀
    20. a3.sinks.k3.hdfs.filePrefix = upload-
    21. #是否按照时间滚动文件夹
    22. a3.sinks.k3.hdfs.round = true
    23. #多少时间单位创建一个新的文件夹
    24. a3.sinks.k3.hdfs.roundValue = 1
    25. #时间向下取整所使用的单位(second、minute 或 hour)
    26. a3.sinks.k3.hdfs.roundUnit = hour
    27. #是否使用本地时间戳(路径中的%Y%m%d/%H需要时间戳,而spooldir source的Event默认不带timestamp header,所以这里必须设为true)
    28. a3.sinks.k3.hdfs.useLocalTimeStamp = true
    29. #积攒多少个Event才flush到HDFS一次
    30. a3.sinks.k3.hdfs.batchSize = 100
    31. #设置文件类型,可支持压缩
    32. a3.sinks.k3.hdfs.fileType = DataStream
    33. #多久(单位:秒)滚动生成一个新的文件
    34. a3.sinks.k3.hdfs.rollInterval = 60
    35. #设置每个文件的滚动大小(单位:字节),大概是128M
    36. a3.sinks.k3.hdfs.rollSize = 134217700
    37. #文件的滚动与Event数量无关
    38. a3.sinks.k3.hdfs.rollCount = 0
    39. # Use a channel which buffers events in memory
    40. a3.channels.c3.type = memory
    41. a3.channels.c3.capacity = 1000
    42. a3.channels.c3.transactionCapacity = 100
    43. # Bind the source and sink to the channel
    44. a3.sources.r3.channels = c3
    45. a3.sinks.k3.channel = c3
    46. 运行flume
    47. bin/flume-ng agent --conf conf/ --name a3 --conf-file job/flume-dir-hdfs.conf
    48. 实验
    49. 往被监控的upload目录中创建文件,包括以.tmp结尾的和以.log结尾的
    50. echo "hha" > log3.log
    51. echo "haha" > log4.tmp
    52. drwxr-xr-x - root supergroup 0 2019-09-01 16:19 /flume/upload
    53. drwxr-xr-x - root supergroup 0 2019-09-01 16:19 /flume/upload/20190901
    54. drwxr-xr-x - root supergroup 0 2019-09-01 16:20 /flume/upload/20190901/16
    55. -rw-r--r-- 3 root supergroup 8 2019-09-01 16:20 /flume/upload/20190901/16/upload-.1567325951362