  • [Hadoop][Spark]Cluster and HA

    #!/bin/bash

    # HOST
    echo '10.211.55.101 spark01' >> /etc/hosts
    echo '10.211.55.102 spark02' >> /etc/hosts
    echo '10.211.55.103 spark03' >> /etc/hosts
    echo '10.211.55.101 linux01' >> /etc/hosts
    echo '10.211.55.102 linux02' >> /etc/hosts
    echo '10.211.55.103 linux03' >> /etc/hosts
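
    # NOTE: this script must run on every node (spark01, spark02, spark03).
    # A hedged sketch for pushing it out from spark01, assuming passwordless
    # root SSH and that the file is saved as /tmp/install-spark.sh (placeholder name):
    #   for h in spark02 spark03; do
    #       scp /tmp/install-spark.sh root@$h:/tmp/ && ssh root@$h bash /tmp/install-spark.sh
    #   done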


    # SPARK download URL (Tsinghua mirror, faster inside China)
    # SPARK_WEB_FILE=https://mirrors.tuna.tsinghua.edu.cn/apache/spark/spark-2.1.1/spark-2.1.1-bin-hadoop2.7.tgz

    # Uncomment to download the SPARK installation file
    # wget -P /tmp $SPARK_WEB_FILE

    # SPARK installation file
    SPARK_INSTALL_FILE=/tmp/spark-2.1.1-bin-hadoop2.7.tgz

    # SPARK directories (referenced below, so they must be set)
    SPARK_INSTALL_DIR=/opt/spark-2.1.1-bin-hadoop2.7
    SPARK_HOME=/opt/spark

    # Install SPARK
    tar -C /opt -xf $SPARK_INSTALL_FILE
    ln -s $SPARK_INSTALL_DIR $SPARK_HOME

    # Create the spark group and user (no login shell)
    groupadd spark
    useradd -g spark -s /sbin/nologin spark

    # Data, log, and PID directories
    mkdir -p /mnt/spark
    mkdir -p /var/log/spark
    mkdir -p $SPARK_HOME/run
    chown spark:spark -R /mnt/spark /var/log/spark
    chown spark:spark -R $SPARK_INSTALL_DIR
    chown spark:spark -R $SPARK_HOME

    # /etc/profile
    echo 'JAVA_HOME=/usr/java/default' >> /etc/profile
    echo 'JRE_HOME=$JAVA_HOME/jre' >> /etc/profile
    echo 'CLASSPATH=.:$JAVA_HOME/lib/dt.jar:$JAVA_HOME/lib/tools.jar:$JRE_HOME/lib' >> /etc/profile
    echo 'HADOOP_HOME=/opt/hadoop' >> /etc/profile
    echo 'HADOOP_PREFIX=$HADOOP_HOME' >> /etc/profile
    echo 'HADOOP_CONF_DIR=$HADOOP_HOME/etc/hadoop' >> /etc/profile
    echo 'HADOOP_PID_DIR=$HADOOP_PREFIX/run' >> /etc/profile
    echo 'YARN_PID_DIR=$HADOOP_PREFIX/run' >> /etc/profile
    echo 'SPARK_HOME=/opt/spark' >> /etc/profile
    echo 'SPARK_PID_DIR=$SPARK_HOME/run' >> /etc/profile
    echo 'PATH=$PATH:$JAVA_HOME/bin:$JRE_HOME/bin:$HADOOP_HOME/bin:$HADOOP_HOME/sbin:$SPARK_HOME/bin:$SPARK_HOME/sbin' >> /etc/profile
    echo 'export JAVA_HOME JRE_HOME CLASSPATH HADOOP_HOME HADOOP_PREFIX HADOOP_CONF_DIR HADOOP_PID_DIR YARN_PID_DIR SPARK_HOME SPARK_PID_DIR PATH' >> /etc/profile

    # Load the variables just written to /etc/profile so the unquoted heredoc below expands them
    source /etc/profile

    # Create the Spark environment configuration file
    cat <<EOF | tee /opt/spark/conf/spark-env.sh
    export JAVA_HOME=$JAVA_HOME
    export HADOOP_HOME=$HADOOP_HOME
    export HADOOP_PREFIX=$HADOOP_PREFIX
    export HADOOP_CONF_DIR=$HADOOP_CONF_DIR
    export SPARK_HOME=/opt/spark
    export SPARK_CONF_DIR=$SPARK_HOME/conf
    export SPARK_PID_DIR=$SPARK_PID_DIR
    export SPARK_DAEMON_JAVA_OPTS="-Dspark.deploy.recoveryMode=ZOOKEEPER -Dspark.deploy.zookeeper.url=zookeeper01:2181,zookeeper02:2181,zookeeper03:2181 -Dspark.deploy.zookeeper.dir=/spark"
    EOF

    chmod +x /opt/spark/conf/spark-env.sh

    # systemd unit so the master starts at boot
    cat <<EOF | tee /usr/lib/systemd/system/spark-master.service
    [Unit]
    Description=Spark Master
    After=syslog.target network.target remote-fs.target nss-lookup.target network-online.target
    Requires=network-online.target

    [Service]
    User=spark
    Group=spark
    Type=forking
    ExecStart=/opt/spark/sbin/start-master.sh
    ExecStop=/opt/spark/sbin/stop-master.sh
    Restart=on-failure

    [Install]
    WantedBy=multi-user.target
    EOF

    # systemd unit so the worker (slave) starts at boot
    cat <<EOF | tee /usr/lib/systemd/system/spark-slave.service
    [Unit]
    Description=Spark Slave
    After=syslog.target network.target remote-fs.target nss-lookup.target network-online.target
    Requires=network-online.target

    [Service]
    User=spark
    Group=spark
    Type=forking
    ExecStart=/opt/spark/sbin/start-slave.sh spark://spark01:7077,spark02:7077,spark03:7077
    ExecStop=/opt/spark/sbin/stop-slave.sh
    Restart=on-failure

    [Install]
    WantedBy=multi-user.target
    EOF
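
    # In this HA layout every node runs both spark-master and spark-slave;
    # ZooKeeper (spark.deploy.recoveryMode=ZOOKEEPER in spark-env.sh above)
    # keeps exactly one master active, and workers re-register with the new
    # leader if the active master fails.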

    firewall-cmd --zone=public --add-port=7077/tcp --permanent
    firewall-cmd --zone=public --add-port=6066/tcp --permanent
    firewall-cmd --zone=public --add-port=8080/tcp --permanent
    firewall-cmd --reload

    # Register the new units, enable them at boot, and start the daemons
    systemctl daemon-reload
    systemctl enable spark-master spark-slave
    systemctl start spark-master spark-slave
    systemctl status spark-master spark-slave
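
    Once the daemons are running on all three nodes, ZooKeeper elects one master as the leader and the other two stay in standby. A quick way to confirm the election is to query each master's web UI; the standalone master serves a JSON summary of its state at /json/ (verify the endpoint and field names against your Spark build). A minimal check, assuming curl is installed and port 8080 is the master UI port opened above:

    # Expect one master to report ALIVE and the other two STANDBY.
    for host in spark01 spark02 spark03; do
        status=$(curl -s "http://${host}:8080/json/" | grep -o '"status" *: *"[A-Z]*"')
        echo "${host}: ${status:-no response}"
    done

    To exercise the failover, stop spark-master on the node that reports ALIVE (systemctl stop spark-master) and re-run the check; one of the standby masters should take over once ZooKeeper notices the leader is gone.

    A simple end-to-end smoke test is to submit the SparkPi example that ships with the binary distribution against the full HA master list, so the client talks to whichever master currently leads. A minimal sketch; the examples jar path assumes the spark-2.1.1-bin-hadoop2.7 package extracted above, so adjust the filename for a different build:

    # Run SparkPi with 100 partitions against the HA master URL.
    /opt/spark/bin/spark-submit \
        --master spark://spark01:7077,spark02:7077,spark03:7077 \
        --class org.apache.spark.examples.SparkPi \
        /opt/spark/examples/jars/spark-examples_2.11-2.1.1.jar 100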

  • Source: https://www.cnblogs.com/wuzhenzhou/p/6918971.html