/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.io.compress.lzma;
import java.io.IOException;
import java.nio.Buffer;
import java.nio.ByteBuffer;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.io.compress.Compressor;
import org.apache.hadoop.util.NativeCodeLoader;
/**
* A {@link Compressor} based on the LZMA algorithm.
*
* @see <a href="http://www.7-zip.org">7-Zip (home of the LZMA SDK)</a>
*/
public class LzmaCompressor implements Compressor {
  private static final Log LOG =
    LogFactory.getLog(LzmaCompressor.class.getName());

  private static final int DEFAULT_DIRECT_BUFFER_SIZE = 64*1024;
  private static final int DEFAULT_COMPRESS_LEVEL = 7;

  // HACK - Use this as a global lock in the JNI layer
  // NOTE(review): field names/types in this class are presumably resolved by
  // name from native code (see initIDs()); do not rename or retype them
  // without checking the native sources.
  private static Class clazz = LzmaCompressor.class;

  // Opaque handle returned by the native init(); 0 means "no stream".
  private long stream;
  private int level;
  private int directBufferSize;

  // Caller-supplied input that has not yet been copied to the direct buffer.
  private byte[] userBuf = null;
  private int userBufOff = 0, userBufLen = 0;

  // Staging buffer for uncompressed input.
  // NOTE(review): the Off/Len pair is only (re)initialised from Java; it is
  // presumably advanced by the native compressBytesDirect() - confirm.
  private Buffer uncompressedDirectBuf = null;
  private int uncompressedDirectBufOff = 0, uncompressedDirectBufLen = 0;

  // Staging buffer for compressed output; "empty" is position == limit.
  private Buffer compressedDirectBuf = null;

  // 'finish' is set by finish(); 'finished' is never written from Java and is
  // presumably set by the native layer - confirm.
  private boolean finish, finished;

  // Stays false unless the static initializer below succeeds.
  private static boolean nativeLzmaLoaded = false;

  static {
    if (NativeCodeLoader.isNativeCodeLoaded()) {
      // Initialize the native library
      try {
        initIDs();
        nativeLzmaLoaded = true;
      } catch (Throwable t) {
        // Failure to load/initialize native-lzma is not fatal for the JVM:
        // record it (with the full stack trace) and report "not loaded".
        LOG.error("initIDs() failed in LzmaCompressor...", t);
        nativeLzmaLoaded = false;
      }
    } else {
      LOG.error("Cannot load " + LzmaCompressor.class.getName() +
                " without native-hadoop library!");
      nativeLzmaLoaded = false;
    }
  }

  /**
   * Check if lzma compressors are loaded and initialized.
   *
   * @return <code>true</code> if lzma compressors are loaded &amp; initialized,
   *         else <code>false</code>
   */
  public static boolean isNativeLzmaLoaded() {
    return nativeLzmaLoaded;
  }

  /**
   * Creates a new compressor using the specified compression level.
   *
   * @param compress_level compression level handed to the native lzma stream
   * @param directBufferSize size, in bytes, of each of the two direct buffers
   *                         (uncompressed input and compressed output)
   */
  public LzmaCompressor(int compress_level, int directBufferSize) {
    this.level = compress_level;
    this.directBufferSize = directBufferSize;

    uncompressedDirectBuf = ByteBuffer.allocateDirect(directBufferSize);
    compressedDirectBuf = ByteBuffer.allocateDirect(directBufferSize);
    // position == limit: no compressed output is available yet
    compressedDirectBuf.position(directBufferSize);

    stream = init(this.level);
  }

  /**
   * Creates a new compressor with the default compression level and the
   * default direct buffer size.
   */
  public LzmaCompressor() {
    this(DEFAULT_COMPRESS_LEVEL,
         DEFAULT_DIRECT_BUFFER_SIZE);
  }

  /**
   * Supplies input to be compressed. At most <code>directBufferSize</code>
   * bytes are staged immediately; the remainder is kept by reference and
   * staged later from {@link #needsInput()}. Any compressed output still
   * held in the output buffer is discarded.
   *
   * @param b   input data
   * @param off start offset in <code>b</code>
   * @param len number of bytes to use
   * @throws NullPointerException if <code>b</code> is <code>null</code>
   * @throws ArrayIndexOutOfBoundsException if the range is outside
   *         <code>b</code>
   */
  public synchronized void setInput(byte[] b, int off, int len) {
    checkBounds(b, off, len);

    this.userBuf = b;
    this.userBufOff = off;
    this.userBufLen = len;
    setInputFromSavedData();

    // Reinitialize lzma's output direct buffer
    compressedDirectBuf.limit(directBufferSize);
    compressedDirectBuf.position(directBufferSize);
  }

  /**
   * If a write would exceed the capacity of the direct buffers, it is set
   * aside to be loaded by this function while the compressed data are
   * consumed.
   */
  synchronized void setInputFromSavedData() {
    uncompressedDirectBufOff = 0;
    uncompressedDirectBufLen = userBufLen;
    if (uncompressedDirectBufLen > directBufferSize) {
      uncompressedDirectBufLen = directBufferSize;
    }

    // Reinitialize lzma's input direct buffer
    uncompressedDirectBuf.rewind();
    ((ByteBuffer)uncompressedDirectBuf).put(userBuf, userBufOff,
                                            uncompressedDirectBufLen);

    // Note how much data is being fed to lzma
    userBufOff += uncompressedDirectBufLen;
    userBufLen -= uncompressedDirectBufLen;
  }

  /** No-op: this compressor ignores preset dictionaries. */
  public synchronized void setDictionary(byte[] b, int off, int len) {
    // nop
  }

  /**
   * {@inheritDoc}
   *
   * Synchronized like the other state-touching methods: it reads the buffer
   * bookkeeping and may refill the input buffer from saved user data.
   */
  public synchronized boolean needsInput() {
    // Consume remaining compressed data?
    if (compressedDirectBuf.remaining() > 0) {
      return false;
    }

    // Check if lzma has consumed all input
    if (uncompressedDirectBufLen <= 0) {
      // Check if we have consumed all user-input
      if (userBufLen <= 0) {
        return true;
      } else {
        setInputFromSavedData();
      }
    }

    return false;
  }

  /** Marks that no further input will be supplied. */
  public synchronized void finish() {
    finish = true;
  }

  /**
   * @return <code>true</code> once {@link #finish()} has been called, the
   *         <code>finished</code> flag is set, and the compressed output
   *         buffer has been fully drained
   */
  public synchronized boolean finished() {
    // Check if 'lzma' says its 'finished' and
    // all compressed data has been consumed
    return (finish && finished && compressedDirectBuf.remaining() == 0);
  }

  /**
   * Copies compressed data into <code>b</code>. Output left over from an
   * earlier call is drained first; only when none is pending is the native
   * compressor invoked.
   *
   * @param b   destination buffer
   * @param off start offset in <code>b</code>
   * @param len maximum number of bytes to copy
   * @return number of bytes written to <code>b</code>
   * @throws NullPointerException if <code>b</code> is <code>null</code>
   * @throws ArrayIndexOutOfBoundsException if the range is outside
   *         <code>b</code>
   * @throws IOException declared by the signature; nothing in the Java code
   *         here throws it
   */
  public synchronized int compress(byte[] b, int off, int len)
    throws IOException {
    checkBounds(b, off, len);

    // Check if there is compressed data
    int n = compressedDirectBuf.remaining();
    if (n > 0) {
      n = Math.min(n, len);
      ((ByteBuffer)compressedDirectBuf).get(b, off, n);
      return n;
    }

    // Re-initialize the lzma's output direct buffer
    compressedDirectBuf.rewind();
    compressedDirectBuf.limit(directBufferSize);

    // Compress data
    // NOTE(review): unlike getBytesRead()/getBytesWritten()/reset(), this path
    // does not call checkStream(); confirm the native code tolerates being
    // invoked after end().
    n = compressBytesDirect();
    compressedDirectBuf.limit(n);

    // Get at most 'len' bytes; the rest stays buffered for the next call
    n = Math.min(n, len);
    ((ByteBuffer)compressedDirectBuf).get(b, off, n);

    return n;
  }

  /**
   * Return number of bytes given to this compressor since last reset, as
   * reported by the native stream.
   *
   * @throws NullPointerException if the stream has been released
   */
  public synchronized long getBytesRead() {
    checkStream();
    return getBytesRead(stream);
  }

  /**
   * Return number of bytes consumed by callers of compress since last reset,
   * as reported by the native stream.
   *
   * @throws NullPointerException if the stream has been released
   */
  public synchronized long getBytesWritten() {
    checkStream();
    return getBytesWritten(stream);
  }

  /**
   * Clears all buffered state and replaces the native stream with a fresh one
   * at the same compression level.
   *
   * @throws NullPointerException if the stream has been released
   */
  public synchronized void reset() {
    checkStream();
    finish = false;
    finished = false;
    uncompressedDirectBuf.rewind();
    uncompressedDirectBufOff = uncompressedDirectBufLen = 0;
    compressedDirectBuf.limit(directBufferSize);
    compressedDirectBuf.position(directBufferSize);
    userBufOff = userBufLen = 0;
    end();
    stream = init(this.level);
  }

  /** Releases the native stream, if any. Safe to call more than once. */
  public synchronized void end() {
    if (stream != 0) {
      end(stream);
      stream = 0;
    }
  }

  /** Fails with a NullPointerException when there is no native stream. */
  private void checkStream() {
    if (stream == 0) {
      throw new NullPointerException();
    }
  }

  /** Validates a (buffer, offset, length) triple the way setInput/compress require. */
  private static void checkBounds(byte[] b, int off, int len) {
    if (b == null) {
      throw new NullPointerException();
    }
    // Written as 'off > b.length - len' to avoid overflow in 'off + len'
    if (off < 0 || len < 0 || off > b.length - len) {
      throw new ArrayIndexOutOfBoundsException();
    }
  }

  private native static void initIDs();
  private native static long init(int level);
  private native int compressBytesDirect();
  private native static long getBytesRead(long strm);
  private native static long getBytesWritten(long strm);
  private native static void end(long strm);
}