TestMissingParity.java example

Explorer
hadoop-20-master
- src
/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.raid;

import java.io.BufferedReader;
import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.File;
import java.io.IOException;
import java.io.InputStreamReader;
import java.io.FileWriter;
import java.io.PrintStream;
import java.io.FileNotFoundException;
import java.io.IOException;
import java.net.URI;
import java.util.Set;
import java.util.HashSet;
import java.util.ArrayList;
import java.util.Collection;
import java.util.GregorianCalendar;
import java.util.Iterator;
import java.util.LinkedList;
import java.util.List;
import java.util.Properties;
import java.util.Random;
import java.util.zip.CRC32;

import junit.framework.TestCase;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;

import org.apache.hadoop.util.StringUtils;
import org.apache.hadoop.util.ToolRunner;
import org.apache.hadoop.fs.BlockLocation;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.FilterFileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hdfs.MiniDFSCluster;
import org.apache.hadoop.hdfs.protocol.ClientProtocol;
import org.apache.hadoop.hdfs.protocol.LocatedBlock;
import org.apache.hadoop.hdfs.protocol.LocatedBlocks;
import org.apache.hadoop.hdfs.protocol.Block;
import org.apache.hadoop.hdfs.DistributedFileSystem;
import org.apache.hadoop.hdfs.DistributedRaidFileSystem;
import org.apache.hadoop.hdfs.TestRaidDfs;
import org.apache.hadoop.hdfs.DFSUtil;
import org.apache.hadoop.raid.RaidNode;
import org.apache.hadoop.raid.MissingParityFiles;
import org.apache.hadoop.raid.RaidShell;
import org.apache.hadoop.mapred.MiniMRCluster;

public class TestMissingParity extends TestCase {
  
  final static String TEST_DIR = new File(System.getProperty("test.build.data",
      "build/contrib/raid/test/data")).getAbsolutePath();
  final static String CONFIG_FILE = new File(TEST_DIR, 
      "test-raid.xml").getAbsolutePath();
  final static long RELOAD_INTERVAL = 1000;
  final static Log LOG = LogFactory.getLog("org.apache.hadoop.raid.TestRaidNode");
  final static Random rand = new Random();

  Configuration conf;
  String namenode = null;
  String hftp = null;
  MiniDFSCluster dfs = null;
  MiniMRCluster mr = null;
  FileSystem fileSys = null;
  String jobTrackerName = null;
  Path root = null;
  Set<String> allExpectedMissingFiles = null;

  private void createClusters(boolean local) throws Exception {
    if (System.getProperty("hadoop.log.dir") == null) {
      String base = new File(".").getAbsolutePath();
      System.setProperty("hadoop.log.dir", new Path(base).toString() + "/logs");
    }

    new File(TEST_DIR).mkdirs(); // Make sure data directory exists
    conf = new Configuration();
    conf.set("raid.config.file", CONFIG_FILE);
    conf.setBoolean("raid.config.reload", true);
    conf.setLong("raid.config.reload.interval", RELOAD_INTERVAL);

    Utils.loadTestCodecs(conf);

    // scan all policies once every 100 second
    conf.setLong("raid.policy.rescan.interval", 100 * 1000L);

    // the RaidNode does the raiding inline (instead of submitting to map/reduce)
    if (local) {
      conf.set("raid.classname", "org.apache.hadoop.raid.LocalRaidNode");
    } else {
      conf.set("raid.classname", "org.apache.hadoop.raid.DistRaidNode");
    }

    // use local block fixer
    conf.set("raid.blockfix.classname", 
             "org.apache.hadoop.raid.LocalBlockIntegrityMonitor");

    conf.set("raid.server.address", "localhost:0");

    // create a dfs and map-reduce cluster
    final int taskTrackers = 4;
    final int jobTrackerPort = 60050;

    dfs = new MiniDFSCluster(conf, 6, true, null);
    dfs.waitActive();
    fileSys = dfs.getFileSystem();

    Path raidRoot = new Path(Codec.getCodec("xor").parityDirectory);
    root = raidRoot.getParent();
    String file1 = "/p1/f1.txt";
    String file2 = "/p1/f2.txt";
    String file3 = "/p2/f3.txt";
    String file4 = "/p2/f4.txt";
    Path fPath1 = new Path(root + file1);
    Path fPath2 = new Path(root + file2);
    Path fPath3 = new Path(root + file3);
    Path fPath4 = new Path(root + file4);
    Path rPath3 = new Path(raidRoot + file3);
    allExpectedMissingFiles = new HashSet<String>();
    allExpectedMissingFiles.add(fPath2.toUri().getPath());
    allExpectedMissingFiles.add(fPath3.toUri().getPath());
    allExpectedMissingFiles.add(fPath4.toUri().getPath());
    fileSys.create(fPath1, (short)3);
    fileSys.create(fPath2, (short)2);
    fileSys.create(fPath3, (short)2);
    fileSys.create(fPath4, (short)2);
    fileSys.create(rPath3, (short)2);
    namenode = fileSys.getUri().toString();
    mr = new MiniMRCluster(taskTrackers, namenode, 3);
    jobTrackerName = "localhost:" + mr.getJobTrackerPort();
    hftp = "hftp://localhost.localdomain:" + dfs.getNameNodePort();

    FileSystem.setDefaultUri(conf, namenode);
    conf.set("mapred.job.tracker", jobTrackerName);
  }

  /**
   * Test whether MissingParityFiles selects the correct files
   * The files selected should be  /p1/f2.txt /p2/f3.txt and  /p2/f4.txt
   */
  public void testMissingRaidFiles() throws Exception {
    try {
      System.out.println("Test unraided files with < 3 replication");
      createClusters(true);
      MissingParityFiles mf1 = new MissingParityFiles(conf);
      ByteArrayOutputStream bout = new ByteArrayOutputStream();
      PrintStream ps = new PrintStream(bout, true);
      mf1.findMissingParityFiles(root, ps);
      ByteArrayInputStream bin = new ByteArrayInputStream(bout.toByteArray());
      BufferedReader r = new BufferedReader(new InputStreamReader(bin));
      String l = null;
      Set<String> missingFiles = new HashSet<String>();
      while ((l = r.readLine()) != null) {
        missingFiles.add(l);
      }
      System.out.println("Missing files count = " + missingFiles.size());
      assertEquals(allExpectedMissingFiles, missingFiles);
    } catch (Exception e) {
      LOG.info("Test testMissingRaidFiles Exception " + e + StringUtils.stringifyException(e));
      throw e;
    } finally {
      dfs.shutdown();
      mr.shutdown();
    }
  }

  /**
   * Test whether the raid shell is correct integrated with MissingParityFiles
   * Again the files selected should be /p1/f2.txt /p2/f3.txt and /p2/f4.txt
   */
  public void testRaidShell() throws Exception {
    try {
      System.out.println("Test shell unraided files with < 3 replication");
      createClusters(true);
      RaidShell shell = new RaidShell(conf);
      String[] args = new String[2];
      args[0] = "-findMissingParityFiles";
      args[1] = root.toString();
      ToolRunner.run(shell, args);
    } catch (Exception e) {
      LOG.info("Test testRaidShell Exception " + e + StringUtils.stringifyException(e));
      throw e;
    } finally {
      dfs.shutdown();
      mr.shutdown();
    }
  }
}