zoukankan      html  css  js  c++  java
  • Hbase0.96源码之HMaster(二)Hmaster主要循环becomeActiveMaster

    1,Hmaster主循环主要这里主要有:

    1,1 becomeActiveMaster(startupStatus);
    1.2 finishInitialization
    1.3 loop()

      becomeActiveMaster(startupStatus);
      // We are either the active master or we were asked to shutdown
      if (!this.stopped) {
        finishInitialization(startupStatus, false);
        loop();
      }
    

    2。becomeActiveMaster(startupStatus);
    2.1.1首先创建一个ActiveMasterManager,负责watch zk上的事件,这里主要是nodeCreated()。nodeDeleted()

      private boolean becomeActiveMaster(MonitoredTask startupStatus)
      throws InterruptedException {
        // TODO: This is wrong!!!! Should have new servername if we restart ourselves,
        // if we come back to life.
        //创建activeMasterManager对象
        this.activeMasterManager = new ActiveMasterManager(zooKeeper, this.serverName,
            this);
        //注冊activeMasterManager到zk
        this.zooKeeper.registerListener(activeMasterManager);
        stallIfBackupMaster(this.conf, this.activeMasterManager);
    
        // The ClusterStatusTracker is setup before the other
        // ZKBasedSystemTrackers because it's needed by the activeMasterManager
        // to check if the cluster should be shutdown.
        this.clusterStatusTracker = new ClusterStatusTracker(getZooKeeper(), this);
        this.clusterStatusTracker.start();
        return this.activeMasterManager.blockUntilBecomingActiveMaster(startupStatus);
      }
    

    2.1.2 ActiveMasterManager上的事件处理这里不管是create还是都是delete节点都是一样的处
    2.1.2.1 nodeCreated()与nodeDeleted事件处理

      @Override
      public void nodeCreated(String path) {
        handle(path);
      }
    
      @Override
      public void nodeDeleted(String path) {
        if(path.equals(watcher.clusterStateZNode) && !master.isStopped()) {
          clusterShutDown.set(true);
        }
    
        handle(path);
      }
    
      void handle(final String path) {
        if (path.equals(watcher.getMasterAddressZNode()) && !master.isStopped()) {
          handleMasterNodeChange();
        }
      }
    

    2.1.2.2。终于的节点创建和删除处理函数,
    2.1.2.2.1这里无论是创建还是删除节点都是同一处理函数,
    2.1.2.2.2假设/hbase/master节点处在说明已经有active master了,
    2.1.2.2.3另外这个 clusterHasActiveMaster.notifyAll();须要关注下,在后面的堵塞成为master会用到

      private void handleMasterNodeChange() {
        // Watch the node and check if it exists.
        try {
          synchronized(clusterHasActiveMaster) {
            if (ZKUtil.watchAndCheckExists(watcher, watcher.getMasterAddressZNode())) {
              // A master node exists, there is an active master
              LOG.debug("A master is now available");
              clusterHasActiveMaster.set(true);
            } else {
              // Node is no longer there, cluster does not have an active master
              LOG.debug("No master available. Notifying waiting threads");
              clusterHasActiveMaster.set(false);
              // Notify any thread waiting to become the active master
              clusterHasActiveMaster.notifyAll();
            }
          }
        } catch (KeeperException ke) {
          master.abort("Received an unexpected KeeperException, aborting", ke);
        }
      }
    

    2.2堵塞成为master

     boolean blockUntilBecomingActiveMaster(MonitoredTask startupStatus) {
        while (true) {
          startupStatus.setStatus("Trying to register in ZK as active master");
          // Try to become the active master, watch if there is another master.
          // Write out our ServerName as versioned bytes.
          try {
              //backupZNode -->/hbase/backup-masters/sn(hostname,port,startcode)
            String backupZNode =
                ZKUtil.joinZNode(this.watcher.backupMasterAddressesZNode, this.sn.toString());
            // watcher.getMasterAddressZNode()-->/hbase/master
            if (MasterAddressTracker.setMasterAddress(this.watcher,
                this.watcher.getMasterAddressZNode(), this.sn)) {
    
              // If we were a backup master before, delete our ZNode from the backup
              // master directory since we are the active now)
              if (ZKUtil.checkExists(this.watcher, backupZNode) != -1) {
                LOG.info("Deleting ZNode for " + backupZNode + " from backup master directory");
                ZKUtil.deleteNodeFailSilent(this.watcher, backupZNode);
              }
              // Save the znode in a file, this will allow to check if we crash in the launch scripts
              ZNodeClearer.writeMyEphemeralNodeOnDisk(this.sn.toString());
    
              // We are the master, return
              startupStatus.setStatus("Successfully registered as active master.");
              this.clusterHasActiveMaster.set(true);
              LOG.info("Registered Active Master=" + this.sn);
              return true;
            }
    
            // There is another active master running elsewhere or this is a restart
            // and the master ephemeral node has not expired yet.
            this.clusterHasActiveMaster.set(true);
    
            /*
            * Add a ZNode for ourselves in the backup master directory since we are
            * not the active master.
            *
            * If we become the active master later, ActiveMasterManager will delete
            * this node explicitly.  If we crash before then, ZooKeeper will delete
            * this node for us since it is ephemeral.
            */
            LOG.info("Adding ZNode for " + backupZNode + " in backup master directory");
            MasterAddressTracker.setMasterAddress(this.watcher, backupZNode, this.sn);
    
            String msg;
            byte[] bytes =
              ZKUtil.getDataAndWatch(this.watcher, this.watcher.getMasterAddressZNode());
            if (bytes == null) {
              msg = ("A master was detected, but went down before its address " +
                "could be read.  Attempting to become the next active master");
            } else {
              ServerName currentMaster;
              try {
                currentMaster = ServerName.parseFrom(bytes);
              } catch (DeserializationException e) {
                LOG.warn("Failed parse", e);
                // Hopefully next time around we won't fail the parse.  Dangerous.
                continue;
              }
              if (ServerName.isSameHostnameAndPort(currentMaster, this.sn)) {
                msg = ("Current master has this master's address, " +
                  currentMaster + "; master was restarted? Deleting node.");
                // Hurry along the expiration of the znode.
                ZKUtil.deleteNode(this.watcher, this.watcher.getMasterAddressZNode());
    
                // We may have failed to delete the znode at the previous step, but
                //  we delete the file anyway: a second attempt to delete the znode is likely to fail again.
                ZNodeClearer.deleteMyEphemeralNodeOnDisk();
              } else {
                msg = "Another master is the active master, " + currentMaster +
                  "; waiting to become the next active master";
              }
            }
            LOG.info(msg);
            startupStatus.setStatus(msg);
          } catch (KeeperException ke) {
            master.abort("Received an unexpected KeeperException, aborting", ke);
            return false;
          }
          synchronized (this.clusterHasActiveMaster) {
            while (this.clusterHasActiveMaster.get() && !this.master.isStopped()) {
              try {
                this.clusterHasActiveMaster.wait();
              } catch (InterruptedException e) {
                // We expect to be interrupted when a master dies,
                //  will fall out if so
                LOG.debug("Interrupted waiting for master to die", e);
              }
            }
            if (clusterShutDown.get()) {
              this.master.stop(
                "Cluster went down before this master became active");
            }
            if (this.master.isStopped()) {
              return false;
            }
            // there is no active master so we can try to become active master again
          }
        }
      }
    

    2.2.1 创建暂时节点/hbase/master,这里主要看
    2.2.1.1

    MasterAddressTracker.setMasterAddress(this.watcher,
                this.watcher.getMasterAddressZNode(), this.sn)
    

    2.2.1.2

      public static boolean setMasterAddress(final ZooKeeperWatcher zkw,
          final String znode, final ServerName master)
      throws KeeperException {
        return ZKUtil.createEphemeralNodeAndWatch(zkw, znode, toByteArray(master));
      }
    

    2.2.1.3,这里不论创建失败成功都会加入zkw事件watcher,成功则成为master。失败则可能是已经有master存在了

      public static boolean createEphemeralNodeAndWatch(ZooKeeperWatcher zkw,
          String znode, byte [] data)
      throws KeeperException {
        try {
          zkw.getRecoverableZooKeeper().create(znode, data, createACL(zkw, znode),
              CreateMode.EPHEMERAL);
        } catch (KeeperException.NodeExistsException nee) {
          if(!watchAndCheckExists(zkw, znode)) {
            // It did exist but now it doesn't, try again
            return createEphemeralNodeAndWatch(zkw, znode, data);
          }
          return false;
        } catch (InterruptedException e) {
          LOG.info("Interrupted", e);
          Thread.currentThread().interrupt();
        }
        return true;
      }
    

    2.2.2假设失败则堵塞则
    2.2.2.1
    假设失败,说明不是active master,增加backup节点

    LOG.info("Adding ZNode for " + backupZNode + " in backup master directory");
    MasterAddressTracker.setMasterAddress(this.watcher, backupZNode, this.sn);
    

    2.2.2.2 再次从zk获取master 的server地址。与自己比較。假设是则说明已经重新启动过

        byte[] bytes =
              ZKUtil.getDataAndWatch(this.watcher, this.watcher.getMasterAddressZNode());
            if (bytes == null) {
              msg = ("A master was detected, but went down before its address " +
                "could be read.  Attempting to become the next active master");
            } else {
              ServerName currentMaster;
              try {
                currentMaster = ServerName.parseFrom(bytes);
              } catch (DeserializationException e) {
                LOG.warn("Failed parse", e);
                // Hopefully next time around we won't fail the parse.  Dangerous.
                continue;
              }
              if (ServerName.isSameHostnameAndPort(currentMaster, this.sn)) {
                msg = ("Current master has this master's address, " +
                  currentMaster + "; master was restarted? Deleting node.");
                // Hurry along the expiration of the znode.
                ZKUtil.deleteNode(this.watcher, this.watcher.getMasterAddressZNode());
    
                // We may have failed to delete the znode at the previous step, but
                //  we delete the file anyway: a second attempt to delete the znode is likely to fail again.
                ZNodeClearer.deleteMyEphemeralNodeOnDisk();
              } else {
                msg = "Another master is the active master, " + currentMaster +
                  "; waiting to become the next active master";
              }
    

    2.2 堵塞在clusterHasActiveMaster,这里等待知道notify。由ActiveMasterManager(2.1.2)来触发

         synchronized (this.clusterHasActiveMaster) {
            while (this.clusterHasActiveMaster.get() && !this.master.isStopped()) {
              try {
                this.clusterHasActiveMaster.wait();
              } catch (InterruptedException e) {
                // We expect to be interrupted when a master dies,
                //  will fall out if so
                LOG.debug("Interrupted waiting for master to die", e);
              }
            }
            if (clusterShutDown.get()) {
              this.master.stop(
                "Cluster went down before this master became active");
            }
            if (this.master.isStopped()) {
              return false;
            }
            // there is no active master so we can try to become active master again
          }
  • 相关阅读:
    理解margin
    dedecms 时间标签strftime和MyDate
    dede调用img图片
    dedecms中调用制定栏目
    在list_*页面显示出一级栏目下的所有二级栏目
    调用二级、三级栏目
    dedecms二级导航标签调用使用的方法
    学习PHP第一天-----简单登录
    Python程序设计9——数据库编程
    Python程序设计8——网络编程
  • 原文地址:https://www.cnblogs.com/mengfanrong/p/5135987.html
Copyright © 2011-2022 走看看