📄 DataNode.java
/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.contrib.dlucene;

import java.io.IOException;
import java.net.InetSocketAddress;
import java.util.concurrent.locks.Lock;
import java.util.concurrent.locks.ReentrantLock;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.contrib.dlucene.data.DataNodeIndexHandler;
import org.apache.hadoop.contrib.dlucene.network.Network;
import org.apache.hadoop.contrib.dlucene.writable.SearchResults;
import org.apache.hadoop.contrib.dlucene.writable.WDocument;
import org.apache.hadoop.contrib.dlucene.writable.WQuery;
import org.apache.hadoop.contrib.dlucene.writable.WSort;
import org.apache.hadoop.contrib.dlucene.writable.WTerm;
import org.apache.hadoop.ipc.RPC;
import org.apache.hadoop.ipc.RemoteException;
import org.apache.hadoop.net.NetUtils;
import org.apache.hadoop.util.StringUtils;
import org.apache.lucene.analysis.standard.StandardAnalyzer;

/**
 * Implements a datanode that stores Lucene indexes.
 */
public class DataNode extends AbstractNode implements
    DataNodeToDataNodeProtocol, ClientToDataNodeProtocol {

  /** Interface to access the namenode. */
  private DataNodeToNameNodeProtocol namenode = null;

  /** Data structure storing index information. */
  private DataNodeIndexHandler data = null;

  /** Status information on this datanode. */
  private DataNodeStatus filesystemStatus = null;

  /** Controls shared access to the data structure. */
  private final Lock lock = new ReentrantLock();

  /** Thread for handling replication requests. */
  private Thread replicationThread = null;

  /** The replication object. */
  private Runnable replicator = null;

  /** The number of commits performed by this node. */
  static int numberOfCommits = 0;

  /*
   * (non-Javadoc)
   *
   * @see org.apache.hadoop.dlucene.AbstractNode#doHeartbeat()
   */
  protected void doHeartbeat() throws IOException {
    HeartbeatResponse hbr = null;
    filesystemStatus.updateUsage();
    lock.lock();
    try {
      hbr = namenode.heartbeat(filesystemStatus, data.getIndexes(), data
          .getLeases());
    } finally {
      lock.unlock();
    }
    if (hbr.getReplicationRequests() != null) {
      for (IndexLocation indexToReplicate : hbr.getReplicationRequests()) {
        filesystemStatus.addReplicationTask(indexToReplicate);
      }
    }
  }

  /**
   * Perform replication tasks.
   *
   * @throws IOException
   */
  protected void doReplication() throws IOException {
    while (shouldRun) {
      LOG.info("DataNode.Replicator.doReplication is running on "
          + nodeAddr.toString());
      try {
        if (filesystemStatus.getReplicationTasks().size() > 0) {
          IndexLocation indexToReplicate = filesystemStatus
              .getNextReplicationTask();
          // need to check that the index has not already been replicated
          data.copyRemoteIndex(indexToReplicate);
          filesystemStatus.removeReplicationTask(indexToReplicate);
          LOG.info(indexToReplicate + " has finished replicating\n");
        }
        try {
          long sleep = heartBeatInterval;
          LOG.info(nodeAddr.toString() + " is alive");
          Thread.sleep(sleep);
        } catch (InterruptedException ie) {
          // ignore and recheck shouldRun
        }
      } catch (RemoteException re) {
        LOG.warn(StringUtils.stringifyException(re));
        shutdown();
        return;
      }
    }
  }

  /**
   * Constructor.
   *
   * @param configuration the Hadoop configuration
   * @param dataNodeAddress the address of this node
   * @param nameNodeAddress the address of the NameNode
   * @param useRamIndex whether to use a RAM based index or not
   * @throws IOException
   */
  protected DataNode(Configuration configuration,
      InetSocketAddress dataNodeAddress, InetSocketAddress nameNodeAddress,
      boolean useRamIndex) throws IOException {
    super(configuration);
    this.nodeAddr = dataNodeAddress;
    // find the network location of this machine
    String rack = configuration.get(Constants.DATANODE_RACK_NAME);
    if (rack == null) { // exec network script or set the default rack
      rack = Network.getNetworkLoc(configuration);
    }
    DataNodeConfiguration dataconf = new DataNodeConfiguration(configuration,
        dataNodeAddress, rack);
    filesystemStatus = new DataNodeStatus(dataconf, configuration);
    // get the interface for calling the namenode
    if (nameNodeAddress != null) {
      this.namenode = (DataNodeToNameNodeProtocol) RPC.waitForProxy(
          DataNodeToNameNodeProtocol.class,
          DataNodeToNameNodeProtocol.VERSION_ID, nameNodeAddress,
          configuration);
    }
    // create the data structure listing indexes on this machine
    data = new DataNodeIndexHandler(dataconf, configuration,
        new StandardAnalyzer(), useRamIndex, namenode);
    init(dataNodeAddress.getHostName(), dataNodeAddress.getPort(),
        configuration, Constants.DATANODE_DEFAULT_NAME);
  }

  /*
   * (non-Javadoc)
   *
   * @see org.apache.hadoop.dlucene.DataNodeToDataNodeProtocol#getFileContent(org.apache.hadoop.dlucene.IndexVersion,
   *      java.lang.String)
   */
  @Override
  public byte[] getFileContent(IndexVersion indexVersion, String file)
      throws IOException {
    Utils.checkArgs(indexVersion, file);
    return data.getFileContent(indexVersion, file);
  }

  /*
   * (non-Javadoc)
   *
   * @see org.apache.hadoop.dlucene.protocols.DataNodeToDataNodeProtocol#getFileSet(org.apache.hadoop.dlucene.IndexVersion)
   */
  @Override
  public String[] getFileSet(IndexVersion indexVersion) throws IOException {
    Utils.checkArgs(indexVersion);
    return data.getFileSet(indexVersion);
  }

  /*
   * (non-Javadoc)
   *
   * @see org.apache.hadoop.ipc.VersionedProtocol#getProtocolVersion(java.lang.String,
   *      long)
   */
  @Override
  public long getProtocolVersion(String protocol, long clientVersion)
      throws IOException {
    Utils.checkArgs(protocol);
    if (protocol.equals(DataNodeToDataNodeProtocol.class.getName())) {
      return DataNodeToDataNodeProtocol.VERSION_ID;
    } else if (protocol.equals(ClientToDataNodeProtocol.class.getName())) {
      return ClientToDataNodeProtocol.VERSION_ID;
    }
    throw new IOException("Unknown protocol to data node: " + protocol);
  }

  /*
   * (non-Javadoc)
   *
   * @see org.apache.hadoop.dlucene.ClientToDataNodeProtocol#addDocument(java.lang.String,
   *      org.apache.hadoop.dlucene.writable.WDocument)
   */
  public void addDocument(String index, WDocument doc) throws IOException {
    Utils.checkArgs(index, doc);
    LOG.debug("Adding document to index " + index);
    data.addDocument(index, doc.getDocument());
  }

  /*
   * (non-Javadoc)
   *
   * @see org.apache.hadoop.dlucene.ClientToDataNodeProtocol#addIndex(java.lang.String,
   *      org.apache.hadoop.dlucene.IndexLocation)
   */
  public void addIndex(String index, IndexLocation indexToAdd)
      throws IOException {
    Utils.checkArgs(index, indexToAdd);
    lock.lock();
    try {
      data.addIndex(index, indexToAdd);
    } finally {
      lock.unlock();
    }
  }

  /*
   * (non-Javadoc)
   *
   * @see org.apache.hadoop.dlucene.protocols.ClientToDataNodeProtocol#commitVersion(java.lang.String)
   */
  @Override
  public IndexVersion commitVersion(String id) throws IOException {
    Utils.checkArgs(id);
    IndexVersion result = null;
    lock.lock();
    try {
      result = data.commitVersion(id);
      numberOfCommits++;
      LOG.debug("Committing " + id + " number of commits " + numberOfCommits
          + " to version " + result.toString() + " on "
          + nodeAddr.getHostName() + ":" + nodeAddr.getPort());
    } finally {
      lock.unlock();
    }
    doHeartbeat();
    return result;
  }

  /*
   * (non-Javadoc)
   *
   * @see org.apache.hadoop.dlucene.protocols.ClientToDataNodeProtocol#removeDocuments(java.lang.String,
   *      org.apache.lucene.index.Term)
   */
  @Override
  public int removeDocuments(String index, WTerm term) throws IOException {
    Utils.checkArgs(index, term);
    return data.removeDocuments(index, term.getTerm());
  }

  /*
   * (non-Javadoc)
   *
   * @see org.apache.hadoop.dlucene.protocols.ClientToDataNodeProtocol#search(org.apache.hadoop.dlucene.data.IndexVersion,
   *      org.apache.lucene.search.Query, org.apache.lucene.search.Sort, int)
   */
  @Override
  public SearchResults search(IndexVersion i, WQuery query, WSort sort, int n)
      throws IOException {
    Utils.checkArgs(i, query, sort);
    return data.search(i, query.getQuery(), sort.getSort(), n);
  }

  /*
   * (non-Javadoc)
   *
   * @see org.apache.hadoop.dlucene.protocols.ClientToDataNodeProtocol#createIndex(java.lang.String)
   */
  @Override
  public IndexVersion createIndex(String index) throws IOException {
    Utils.checkArgs(index);
    IndexVersion result = null;
    LOG.debug("Datanode creating index " + index);
    lock.lock();
    try {
      result = data.createIndex(index);
    } finally {
      lock.unlock();
    }
    LOG.debug("Datanode created index with result " + result);
    doHeartbeat();
    return result;
  }

  /**
   * Get the size of the specified index.
   *
   * @param index the index name
   * @return the size of the index
   * @throws IOException
   */
  public int size(String index) throws IOException {
    Utils.checkArgs(index);
    return data.size(index);
  }

  /**
   * Start the node from the command line.
   *
   * @param args use -r to specify the rack that the node is on
   */
  public static void main(String[] args) {
    Configuration conf = new Configuration();
    try {
      StringUtils.startupShutdownMessage(DataNode.class, args, LOG);
      DataNode datanode = null;
      if (!parseArguments(args, conf)) {
        printUsage(DataNode.class.toString());
      } else {
        InetSocketAddress dataNodeAddr = NetUtils.createSocketAddr(conf.get(
            Constants.DATANODE_DEFAULT_NAME,
            Constants.DATANODE_DEFAULT_NAME_VALUE));
        InetSocketAddress nameNodeAddr = NetUtils.createSocketAddr(conf.get(
            Constants.NAMENODE_DEFAULT_NAME,
            Constants.NAMENODE_DEFAULT_NAME_VALUE));
        datanode = createNode(conf, dataNodeAddr, nameNodeAddr, false);
        if (datanode != null) {
          datanode.join();
        }
      }
    } catch (Throwable e) {
      e.printStackTrace();
      LOG.error(StringUtils.stringifyException(e));
      System.exit(-1);
    }
  }

  /**
   * Create a node.
   *
   * @param configuration the Hadoop configuration
   * @param dataNodeAddress the address of this node
   * @param nameNodeAddress the address of the NameNode
   * @param useRamIndex whether to use a RAM based index or not
   * @return a DataNode instance
   * @throws IOException
   */
  protected static DataNode createNode(Configuration configuration,
      InetSocketAddress dataNodeAddress, InetSocketAddress nameNodeAddress,
      boolean useRamIndex) throws IOException {
    DataNode dn = new DataNode(configuration, dataNodeAddress,
        nameNodeAddress, useRamIndex);
    // set up threads for sending heartbeats and handling replication
    dn.initThreads();
    return dn;
  }

  /**
   * Initialize the heartbeat and replication threads.
   */
  private void initThreads() {
    heartBeatClass = new HeartBeater();
    heartBeatThread = new Thread(heartBeatClass, DataNode.class.toString()
        + ": heartbeat thread");
    heartBeatThread.setDaemon(true); // needed for JUnit testing
    heartBeatThread.start();
    replicator = new Replicator();
    replicationThread = new Thread(replicator, DataNode.class.toString()
        + ": replication thread");
    replicationThread.setDaemon(true);
    replicationThread.start();
  }

  /**
   * The class that performs replication.
   */
  private class Replicator implements Runnable {

    /*
     * (non-Javadoc)
     *
     * @see java.lang.Runnable#run()
     */
    public void run() {
      LOG.info("DataNode.Replicator.run is running on " + nodeAddr.toString());
      try {
        doReplication();
      } catch (Exception e) {
        LOG.error("Exception: " + StringUtils.stringifyException(e));
        shutdown();
      }
      LOG.info("Finishing DataNode in: " + data);
    }
  }

  /**
   * The class that performs heartbeats.
   */
  private class HeartBeater implements Runnable {

    /*
     * (non-Javadoc)
     *
     * @see java.lang.Runnable#run()
     */
    public void run() {
      LOG.info("DataNode.HeartBeater.run is running on " + nodeAddr.toString());
      try {
        offerService();
      } catch (Exception e) {
        LOG.error("Exception: " + StringUtils.stringifyException(e));
        shutdown();
      }
      LOG.info("Finishing DataNode in: " + data);
    }
  }

  /**
   * Stop the threads used by the node.
   */
  public void shutdown() {
    LOG.info("Shutting down DataNode");
    super.shutdown();
    if (replicationThread != null && replicationThread.isAlive()) {
      replicationThread.interrupt();
    }
  }
}
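
For reference, a minimal sketch of how this node might be started in-process, for example from a test in the same package (createNode is protected, so it is only reachable from org.apache.hadoop.contrib.dlucene; its signature and the join() call are taken from the listing above). The class name DataNodeStarter and the host:port values are hypothetical placeholders; a real deployment would read the addresses from the configuration keys used in DataNode.main().

package org.apache.hadoop.contrib.dlucene;

import java.net.InetSocketAddress;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.net.NetUtils;

/** Hypothetical launcher, sketching the createNode() startup path. */
public class DataNodeStarter {
  public static void main(String[] args) throws Exception {
    Configuration conf = new Configuration();
    // Placeholder addresses; substitute the values from your configuration.
    InetSocketAddress dataNodeAddr = NetUtils.createSocketAddr("localhost:9010");
    InetSocketAddress nameNodeAddr = NetUtils.createSocketAddr("localhost:9000");
    // false = use an on-disk Lucene index rather than a RAM-based one.
    DataNode datanode = DataNode.createNode(conf, dataNodeAddr, nameNodeAddr, false);
    if (datanode != null) {
      datanode.join(); // block until the node shuts down
    }
  }
}

Because createNode() starts the daemon heartbeat and replication threads before returning, join() is what keeps the process alive, mirroring the behavior of DataNode.main().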