zoukankan      html  css  js  c++  java
  • 大数据技术之Flume 配置示例

    大数据技术之Flume 配置示例   1 & 3


    [root@bigdatacloud conf]# cat test1
    # Flume agent "a1": declares one source (r1), one sink (k1) and one
    # channel (c1). The components are configured and wired together below.
    a1.sources = r1
    a1.sinks = k1
    a1.channels = c1

    # Describe/configure the source
    # r1 is a netcat source bound to 0.0.0.0 (all interfaces) on port 44444.
    a1.sources.r1.type = netcat
    a1.sources.r1.bind =0.0.0.0
    a1.sources.r1.port = 44444

    # Describe the sink
    # k1 is a logger sink; no further sink properties are set here.
    a1.sinks.k1.type = logger

    # Use a channel which buffers events in memory
    # capacity and transactionCapacity are event counts per the Flume user
    # guide (max events held / max events per transaction).
    a1.channels.c1.type = memory
    a1.channels.c1.capacity = 1000
    a1.channels.c1.transactionCapacity = 100

    # Bind the source and sink to the channel
    # Note the key names differ: the source uses plural "channels",
    # the sink uses singular "channel".
    a1.sources.r1.channels = c1
    a1.sinks.k1.channel = c1


    ====================

    [root@bigdatacloud conf]# cat test2
    # Flume agent "a1": declares one source (r1), one sink (k1) and one
    # channel (c1). The components are configured and wired together below.
    a1.sources=r1
    a1.sinks=k1
    a1.channels=c1

    # Describe/configure the source
    # r1 is a spooling-directory source reading from /opt/sqooldir.
    # NOTE(review): "sqooldir" looks like a typo for "spooldir" -- confirm the
    # actual directory name on the host before changing it.
    a1.sources.r1.type=spooldir
    a1.sources.r1.spoolDir=/opt/sqooldir

    # Describe the sink
    # k1 is an avro sink sending to host "bigdatastorm" on port 44444.
    # NOTE(review): presumably the receiving end is an avro source listening
    # on that host/port (the test3 config uses port 44444) -- confirm.
    a1.sinks.k1.type=avro
    a1.sinks.k1.hostname=bigdatastorm
    a1.sinks.k1.port=44444

    # Use a channel which buffers events in memory
    # capacity and transactionCapacity are event counts per the Flume user
    # guide (max events held / max events per transaction).
    a1.channels.c1.type=memory
    a1.channels.c1.capacity=1000
    a1.channels.c1.transactionCapacity=100

    # Bind the source and sink to the channel
    # Note the key names differ: the source uses plural "channels",
    # the sink uses singular "channel".
    a1.sources.r1.channels=c1
    a1.sinks.k1.channel=c1

    =========================

    [root@bigdatacloud conf]# cat test3
    # Flume agent "a1": declares one source (r1), one sink (k1) and one
    # channel (c1). The components are configured and wired together below.
    a1.sources=r1
    a1.sinks=k1
    a1.channels=c1

    # Describe/configure the source
    # r1 is an avro source bound to 0.0.0.0 (all interfaces) on port 44444.
    a1.sources.r1.type=avro
    a1.sources.r1.bind=0.0.0.0
    a1.sources.r1.port=44444

    # Describe the sink
    # k1 is an HDFS sink writing under hdfs://mycluster/flume/data/, in a
    # subdirectory named by the %y-%m-%d escape sequences (two-digit year,
    # month, day per the Flume user guide).
    # Per the Flume user guide for the HDFS sink:
    #   rollInterval=0    -> no time-based file rolling
    #   rollCount=0       -> no event-count-based file rolling
    #   rollSize=10240000 -> roll once the file reaches this many bytes
    #   fileType=DataStream -> write event bodies as-is, no SequenceFile wrapper
    #   idleTimeout=5     -> close a file after 5 seconds without writes
    #   useLocalTimeStamp=true -> resolve the path escapes from local time
    #                             instead of an event "timestamp" header
    #   callTimeout=10000 -> timeout in milliseconds for HDFS operations
    a1.sinks.k1.type=hdfs
    a1.sinks.k1.hdfs.path=hdfs://mycluster/flume/data/%y-%m-%d
    a1.sinks.k1.hdfs.rollInterval=0
    a1.sinks.k1.hdfs.rollCount=0
    a1.sinks.k1.hdfs.rollSize=10240000
    a1.sinks.k1.hdfs.fileType=DataStream
    a1.sinks.k1.hdfs.idleTimeout=5
    a1.sinks.k1.hdfs.useLocalTimeStamp=true
    a1.sinks.k1.hdfs.callTimeout=10000

    # The three commented-out lines below are identical to each other and
    # repeat the active sink type set above; they have no effect.
    #a1.sinks.k1.type=hdfs
    #a1.sinks.k1.type=hdfs
    #a1.sinks.k1.type=hdfs

    # Use a channel which buffers events in memory
    # capacity and transactionCapacity are event counts per the Flume user
    # guide (max events held / max events per transaction).
    a1.channels.c1.type=memory
    a1.channels.c1.capacity=1000
    a1.channels.c1.transactionCapacity=100

    # Bind the source and sink to the channel
    # Note the key names differ: the source uses plural "channels",
    # the sink uses singular "channel".
    a1.sources.r1.channels=c1
    a1.sinks.k1.channel=c1

    ====================

    [root@bigdatacloud conf]# cat getnginxlog
    # Flume agent "a1": declares one source (r1), one sink (k1) and one
    # channel (c1). The components are configured and wired together below.
    a1.sources=r1
    a1.sinks=k1
    a1.channels=c1

    # Describe/configure the source
    # r1 is an exec source running "tail -F" on
    # /opt/first_project/data/access.log. The avro source settings
    # (type/bind/port) are left commented out as an inactive alternative.
    # NOTE(review): the Flume user guide warns that the exec source offers no
    # delivery guarantee if the agent or channel fails -- confirm that
    # occasional loss of log lines is acceptable here.
    #a1.sources.r1.type=avro
    a1.sources.r1.type=exec
    #a1.sources.r1.bind=0.0.0.0
    #a1.sources.r1.port=44444
    a1.sources.r1.command=tail -F /opt/first_project/data/access.log

    # Describe the sink
    # k1 is an HDFS sink writing under hdfs://mycluster/flume/data1/, in a
    # subdirectory named by the %y-%m-%d escape sequences (two-digit year,
    # month, day per the Flume user guide).
    # Per the Flume user guide for the HDFS sink:
    #   rollInterval=0    -> no time-based file rolling
    #   rollCount=0       -> no event-count-based file rolling
    #   rollSize=10240000 -> roll once the file reaches this many bytes
    #   fileType=DataStream -> write event bodies as-is, no SequenceFile wrapper
    #   idleTimeout=5     -> close a file after 5 seconds without writes
    #   useLocalTimeStamp=true -> resolve the path escapes from local time
    #                             instead of an event "timestamp" header
    #   callTimeout=10000 -> timeout in milliseconds for HDFS operations
    a1.sinks.k1.type=hdfs
    a1.sinks.k1.hdfs.path=hdfs://mycluster/flume/data1/%y-%m-%d
    a1.sinks.k1.hdfs.rollInterval=0
    a1.sinks.k1.hdfs.rollCount=0
    a1.sinks.k1.hdfs.rollSize=10240000
    a1.sinks.k1.hdfs.fileType=DataStream
    a1.sinks.k1.hdfs.idleTimeout=5
    a1.sinks.k1.hdfs.useLocalTimeStamp=true
    a1.sinks.k1.hdfs.callTimeout=10000

    # The three commented-out lines below are identical to each other and
    # repeat the active sink type set above; they have no effect.
    #a1.sinks.k1.type=hdfs
    #a1.sinks.k1.type=hdfs
    #a1.sinks.k1.type=hdfs

    # Use a channel which buffers events in memory
    # capacity and transactionCapacity are event counts per the Flume user
    # guide (max events held / max events per transaction).
    a1.channels.c1.type=memory
    a1.channels.c1.capacity=1000
    a1.channels.c1.transactionCapacity=100

    # Bind the source and sink to the channel
    # Note the key names differ: the source uses plural "channels",
    # the sink uses singular "channel".
    a1.sources.r1.channels=c1
    a1.sinks.k1.channel=c1


  • 相关阅读:
    使用迭代器模式批量获得数据(C#实现)
    如何从技术上预防抢票软件刷屏
    如何用Tesseract做日文OCR(c#实现)
    我的.net开发百宝箱
    程序员必备基础:Git 命令全方位学习
    Java 异常处理的十个建议
    50道Java集合经典面试题(收藏版)
    记一次接口性能优化实践总结:优化接口性能的八个建议
    100道MySQL数据库经典面试题解析(收藏版)
    800+Java后端经典面试题,希望你找到自己理想的Offer呀~
  • 原文地址:https://www.cnblogs.com/TendToBigData/p/10501492.html
Copyright © 2011-2022 走看看