⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 testtextinputformat.java

📁 Hadoop是一个在由廉价硬件组成的大型集群上运行应用程序的框架。Hadoop透明地为应用程序提供了一组稳定、可靠的接口和数据移动机制。Hadoop中实现了Google的MapReduce算法。
💻 JAVA
字号:
/**
 * Copyright 2005 The Apache Software Foundation
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.hadoop.mapred;

import java.io.*;
import java.util.*;
import junit.framework.TestCase;
import java.util.logging.*;

import org.apache.hadoop.fs.*;
import org.apache.hadoop.io.*;
import org.apache.hadoop.conf.*;

/**
 * Randomized test of {@link TextInputFormat} splitting.
 *
 * <p>For a series of file sizes, a text file containing the lines
 * <code>0 .. length-1</code> is written, split several times into a random
 * number of pieces, and every split is read back.  The test asserts that each
 * line is delivered by exactly one split: no line twice, no line missing.
 *
 * <p>The random seed is logged at FINE level and included in every assertion
 * message so that a failing run can be investigated.
 */
public class TestTextInputFormat extends TestCase {
  private static final Logger LOG = InputFormatBase.LOG;

  /** Exclusive upper bound on the number of lines written to the test file. */
  private static final int MAX_LENGTH = 10000;

  /** How many different random split counts are tried for each file. */
  private static final int ROUNDS_PER_FILE = 3;

  private static final Configuration conf = new Configuration();

  /**
   * Writes files of increasing random length and verifies, for several random
   * split counts each, that the splits partition the file's lines exactly.
   *
   * @throws Exception if file-system access, splitting or reading fails
   */
  public void testFormat() throws Exception {
    JobConf job = new JobConf(conf);
    FileSystem fs = FileSystem.getNamed("local", conf);
    File dir = new File(System.getProperty("test.build.data",".") + "/mapred");
    File file = new File(dir, "test.txt");

    // The record readers need a reporter; status updates are simply discarded.
    Reporter reporter = new Reporter() {
        public void setStatus(String status) throws IOException {}
      };

    // A fresh seed per run widens coverage; it is reported so that a failure
    // is not a one-off mystery.
    int seed = new Random().nextInt();
    LOG.fine("seed = " + seed);
    Random random = new Random(seed);

    // start from a clean input directory
    fs.delete(dir);
    job.setInputDir(dir);

    // for a variety of lengths
    for (int length = 0; length < MAX_LENGTH;
         length += random.nextInt(MAX_LENGTH/10)+1) {

      LOG.fine("creating; entries = " + length);
      writeNumberedLines(fs, file, length);

      // try splitting the file in a variety of sizes
      InputFormat format = new TextInputFormat();
      for (int i = 0; i < ROUNDS_PER_FILE; i++) {
        int numSplits = random.nextInt(MAX_LENGTH/20)+1;
        checkSplits(format, fs, job, reporter, numSplits, length, seed);
      }
    }
  }

  /**
   * Creates <code>file</code> containing the decimal numbers
   * <code>0 .. length-1</code>, one per line.
   */
  private static void writeNumberedLines(FileSystem fs, File file, int length)
    throws Exception {
    Writer writer = new OutputStreamWriter(fs.create(file));
    try {
      for (int i = 0; i < length; i++) {
        writer.write(Integer.toString(i));
        writer.write("\n");
      }
    } finally {
      writer.close();
    }
  }

  /**
   * Requests <code>numSplits</code> splits of the job's input, reads every
   * split, and asserts that the values <code>0 .. length-1</code> are each
   * seen exactly once across all splits.
   *
   * @param numSplits number of splits requested from the format
   * @param length    number of lines that were written to the input file
   * @param seed      seed of the current run, used only in messages
   */
  private static void checkSplits(InputFormat format, FileSystem fs,
                                  JobConf job, Reporter reporter,
                                  int numSplits, int length, int seed)
    throws Exception {
    LOG.fine("splitting: requesting = " + numSplits);
    FileSplit[] splits = format.getSplits(fs, job, numSplits);
    LOG.fine("splitting: got =        " + splits.length);

    String context =
      " (length=" + length + ", numSplits=" + numSplits + ", seed=" + seed + ")";

    LongWritable key = new LongWritable();
    UTF8 value = new UTF8();

    // bit v is set once line "v" has been returned by some split
    BitSet seen = new BitSet(length);
    for (int j = 0; j < splits.length; j++) {
      RecordReader reader =
        format.getRecordReader(fs, splits[j], job, reporter);
      try {
        while (reader.next(key, value)) {
          int v = Integer.parseInt(value.toString());
          // Build the message only on failure: this loop runs once per record.
          if (seen.get(v)) {
            fail("Key in multiple partitions." + context
                 + " value=" + v + " splits[" + j + "]=" + splits[j]);
          }
          seen.set(v);
        }
      } finally {
        reader.close();
      }
    }
    assertEquals("Some keys in no partition." + context,
                 length, seen.cardinality());
  }

  /** Runs the test directly, without a JUnit runner. */
  public static void main(String[] args) throws Exception {
    new TestTextInputFormat().testFormat();
  }
}

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -