/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.hdfs;

import java.io.IOException;
import java.util.Arrays;

import org.apache.commons.logging.impl.Log4JLogger;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.hdfs.server.datanode.DataNode;
import org.apache.hadoop.hdfs.server.datanode.SimulatedFSDataset;
import org.apache.hadoop.hdfs.server.namenode.FSNamesystem;
import org.apache.hadoop.hdfs.server.namenode.LeaseManager;
import org.apache.log4j.Level;
import org.junit.Test;

/**
 * This class tests that blocks can be larger than 2GB.
 */
public class TestLargeBlock extends junit.framework.TestCase {
  static final String DIR = "/" + TestLargeBlock.class.getSimpleName() + "/";

  {
    // Uncomment to raise log levels while debugging:
    // ((Log4JLogger)DataNode.LOG).getLogger().setLevel(Level.ALL);
    // ((Log4JLogger)LeaseManager.LOG).getLogger().setLevel(Level.ALL);
    // ((Log4JLogger)FSNamesystem.LOG).getLogger().setLevel(Level.ALL);
    // ((Log4JLogger)DFSClient.LOG).getLogger().setLevel(Level.ALL);
  }

  // should we verify the data read back from the file? (slow)
  static final boolean verifyData = true;
  static final byte[] pattern = { 'D', 'E', 'A', 'D', 'B', 'E', 'E', 'F' };
  static final boolean simulatedStorage = false;

  /**
   * Creates a file with the given replication factor and block size.
   */
  static FSDataOutputStream createFile(FileSystem fileSys, Path name, int repl,
      final long blockSize) throws IOException {
    FSDataOutputStream stm = fileSys.create(name, true,
        fileSys.getConf().getInt("io.file.buffer.size", 4096),
        (short) repl, blockSize);
    System.out.println("createFile: Created " + name
        + " with " + repl + " replica.");
    return stm;
  }

  /**
   * Writes the pattern to the file, in chunks.
   */
  static void writeFile(FSDataOutputStream stm, final long fileSize)
      throws IOException {
    // write in chunks of 64 MB; compute the chunk size in long so the
    // overflow guard below is meaningful
    final long writeSizeLong = pattern.length * 8L * 1024 * 1024;
    final int writeCount = (int) ((fileSize / writeSizeLong)
        + ((fileSize % writeSizeLong == 0L) ? 0L : 1L));
    if (writeSizeLong > Integer.MAX_VALUE) {
      throw new IOException("A single write is too large " + writeSizeLong);
    }
    final int writeSize = (int) writeSizeLong;

    long bytesToWrite = fileSize;
    byte[] b = new byte[writeSize];

    // initialize buffer with the repeating pattern
    for (int j = 0; j < writeSize; j++) {
      b[j] = pattern[j % pattern.length];
    }

    int i = 0;
    while (bytesToWrite > 0) {
      // how many bytes we are writing in this iteration
      int thiswrite = (int) Math.min(writeSize, bytesToWrite);
      stm.write(b, 0, thiswrite);
      // System.out.println("Wrote[" + i + "/" + writeCount + "] "
      //     + thiswrite + " bytes.");
      bytesToWrite -= thiswrite;
      i++;
    }
  }

  /**
   * Reads the file back and makes sure its contents match the pattern.
   */
  static void checkFullFile(FileSystem fs, Path name, final long fileSize)
      throws IOException {
    // read in chunks of 128 MB; compute the chunk size in long so the
    // overflow guard below is meaningful
    final long readSizeLong = pattern.length * 16L * 1024 * 1024;
    if (readSizeLong > Integer.MAX_VALUE) {
      throw new IOException("A single read is too large " + readSizeLong);
    }
    final int readSize = (int) readSizeLong;
    final int readCount = (int) ((fileSize / readSizeLong)
        + ((fileSize % readSizeLong == 0L) ? 0L : 1L));

    byte[] b = new byte[readSize];
    long bytesToRead = fileSize;
    byte[] compb = new byte[readSize]; // buffer with correct data for comparison

    if (verifyData) {
      // initialize compare buffer
      for (int j = 0; j < readSize; j++) {
        compb[j] = pattern[j % pattern.length];
      }
    }

    FSDataInputStream stm = fs.open(name);

    int i = 0;
    while (bytesToRead > 0) {
      // how many bytes we are reading in this iteration
      int thisread = (int) Math.min(readSize, bytesToRead);
      stm.readFully(b, 0, thisread);

      if (verifyData) {
        // verify the data read
        if (thisread == readSize) {
          assertTrue("file corrupted at or after byte "
              + (fileSize - bytesToRead), Arrays.equals(b, compb));
        } else {
          // b was only partially filled by the last read
          for (int k = 0; k < thisread; k++) {
            assertTrue("file corrupted at or after byte "
                + (fileSize - bytesToRead), b[k] == compb[k]);
          }
        }
      }
      // System.out.println("Read[" + i + "/" + readCount + "] "
      //     + thisread + " bytes.");
      bytesToRead -= thisread;
      i++;
    }
    stm.close();
  }

  /**
   * Test for a block size of 2GB + 512B.
   */
  @Test
  public void testLargeBlockSize() throws IOException {
    // just past the 2^31 boundary; the extra 512 bytes match the default
    // checksum chunk size (io.bytes.per.checksum)
    final long blockSize = 2L * 1024L * 1024L * 1024L + 512L; // 2GB + 512B
    runTest(blockSize);
  }

  /**
   * Test that we can write to and read from large blocks.
   */
  public void runTest(final long blockSize) throws IOException {

    // write a file that is slightly larger than 1 block
    final long fileSize = blockSize + 1L;

    Configuration conf = new Configuration();
    if (simulatedStorage) {
      conf.setBoolean(SimulatedFSDataset.CONFIG_PROPERTY_SIMULATED, true);
    }
    MiniDFSCluster cluster = new MiniDFSCluster(conf, 1, true, null);
    FileSystem fs = cluster.getFileSystem();
    try {

      // create a new file in the test data directory
      Path file1 = new Path(System.getProperty("test.build.data") + "/"
          + Long.toString(blockSize) + ".dat");
      FSDataOutputStream stm = createFile(fs, file1, 1, blockSize);
      System.out.println("File " + file1 + " created with file size "
          + fileSize + " blocksize " + blockSize);

      // verify that the file exists in the FS namespace
      assertFalse(file1 + " should be a file",
          fs.getFileStatus(file1).isDir());

      // write to the file
      writeFile(stm, fileSize);
      System.out.println("File " + file1 + " written to.");

      // close the file
      stm.close();
      System.out.println("File " + file1 + " closed.");

      // make sure a client can read it
      checkFullFile(fs, file1, fileSize);

      // verify the file size
      long len = fs.getFileStatus(file1).getLen();
      assertTrue(file1 + " should be of size " + fileSize
          + " but found to be of size " + len, len == fileSize);
    } finally {
      cluster.shutdown();
    }
  }
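  /**
   * Sketch of an additional check, not part of the original test: verify
   * that the namenode preserved the requested (larger than 2GB) block size
   * for the file. This assumes FileStatus.getBlockSize() reports the block
   * size the file was created with; a 32-bit truncation anywhere along the
   * write path would show up as a mismatch here. It could be called as
   * checkBlockSize(fs, file1, blockSize) right after checkFullFile above.
   */
  static void checkBlockSize(FileSystem fs, Path name,
      final long expectedBlockSize) throws IOException {
    final long reported = fs.getFileStatus(name).getBlockSize();
    assertTrue(name + " should have block size " + expectedBlockSize
        + " but reported " + reported, reported == expectedBlockSize);
  }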
}