/* Licensed under the Apache License, Version 2.0 (the "License"); you may not use this
 * file except in compliance with the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software distributed under
 * the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS
 * OF ANY KIND, either express or implied. See the License for the specific language
 * governing permissions and limitations under the License.
 */
package net.csdn.modules.compress.lzf;

import java.io.IOException;
import java.io.OutputStream;

/**
 * Class that handles actual encoding of individual chunks.
 * Resulting chunks can be compressed or non-compressed; compression
 * is only used if it actually reduces chunk size (including the overhead
 * of additional header bytes).
 *
 * @author tatu@ning.com
 */
public class ChunkEncoder {
    // Beyond a certain point we won't be able to compress; let's use 16 bytes as the cut-off
    private static final int MIN_BLOCK_TO_COMPRESS = 16;

    private static final int MIN_HASH_SIZE = 256;

    // Not much point in bigger tables, with an 8k window
    private static final int MAX_HASH_SIZE = 16384;

    private static final int MAX_OFF = 1 << 13; // 8k
    private static final int MAX_REF = (1 << 8) + (1 << 3); // 264

    // Encoding tables etc.

    private final BufferRecycler _recycler;

    private int[] _hashTable;

    private final int _hashModulo;

    /**
     * Buffer in which encoded content is stored during processing
     */
    private byte[] _encodeBuffer;

    /**
     * Small buffer passed to LZFChunk, needed for writing chunk header
     */
    private byte[] _headerBuffer;

    /**
     * @param totalLength Total encoded length; used for calculating size
     *                    of hash table to use
     */
    // ES: Added recycler as a parameter so we can control its caching
    public ChunkEncoder(int totalLength, BufferRecycler recycler) {
        int largestChunkLen = Math.max(totalLength, LZFChunk.MAX_CHUNK_LEN);
        int suggestedHashLen = calcHashLen(largestChunkLen);
        _recycler = recycler;
        _hashTable = _recycler.allocEncodingHash(suggestedHashLen);
        _hashModulo = _hashTable.length - 1;
        // Ok, then, what's the worst case output buffer length?
        // One length indicator for each run of up to 32 literals, so:
        int bufferLen = largestChunkLen + ((largestChunkLen + 31) >> 5);
        _encodeBuffer = _recycler.allocEncodingBuffer(bufferLen);
    }

    /*
    ///////////////////////////////////////////////////////////////////////
    // Public API
    ///////////////////////////////////////////////////////////////////////
     */

    /**
     * Method to close once encoder is no longer in use. Note: after calling
     * this method, further calls to {@link #encodeChunk} will fail.
     */
    public void close() {
        byte[] buf = _encodeBuffer;
        if (buf != null) {
            _encodeBuffer = null;
            _recycler.releaseEncodeBuffer(buf);
        }
        int[] ibuf = _hashTable;
        if (ibuf != null) {
            _hashTable = null;
            _recycler.releaseEncodingHash(ibuf);
        }
    }

    /**
     * Method for compressing (or not) individual chunks
     */
    public LZFChunk encodeChunk(byte[] data, int offset, int len) {
        if (len >= MIN_BLOCK_TO_COMPRESS) {
            /* If we have a non-trivial block, and can compress it by at least
             * 2 bytes (since header is 2 bytes longer), let's compress:
             */
            int compLen = tryCompress(data, offset, offset + len, _encodeBuffer, 0);
            if (compLen < (len - 2)) { // compression saved at least 2 bytes; use compressed form
                return LZFChunk.createCompressed(len, _encodeBuffer, 0, compLen);
            }
        }
        // Otherwise leave uncompressed:
        return LZFChunk.createNonCompressed(data, offset, len);
    }
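
    /* Usage sketch (illustrative only, not part of this class): encoding one
     * buffer into an LZFChunk. The "recycler" and "data" variables stand in for
     * whatever the caller manages; how a BufferRecycler is obtained depends on
     * the surrounding code.
     *
     *   ChunkEncoder encoder = new ChunkEncoder(data.length, recycler);
     *   try {
     *       LZFChunk chunk = encoder.encodeChunk(data, 0, data.length);
     *       // chunk is compressed only if that actually saved space
     *   } finally {
     *       encoder.close(); // returns internal buffers to the recycler
     *   }
     */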

    /**
     * Method for encoding individual chunk, writing it to given output stream.
     */
    public void encodeAndWriteChunk(byte[] data, int offset, int len, OutputStream out) throws IOException {
        byte[] headerBuf = _headerBuffer;
        if (headerBuf == null) {
            _headerBuffer = headerBuf = new byte[LZFChunk.MAX_HEADER_LEN];
        }
        if (len >= MIN_BLOCK_TO_COMPRESS) {
            /* If we have a non-trivial block, and can compress it by at least
             * 2 bytes (since header is 2 bytes longer), let's compress:
             */
            int compLen = tryCompress(data, offset, offset + len, _encodeBuffer, 0);
            if (compLen < (len - 2)) { // compression saved at least 2 bytes; write compressed form
                LZFChunk.writeCompressedHeader(len, compLen, out, headerBuf);
                out.write(_encodeBuffer, 0, compLen);
                return;
            }
        }
        // Otherwise leave uncompressed:
        LZFChunk.writeNonCompressedHeader(len, out, headerBuf);
        out.write(data, offset, len);
    }

    /*
    ///////////////////////////////////////////////////////////////////////
    // Internal methods
    ///////////////////////////////////////////////////////////////////////
     */

    private static int calcHashLen(int chunkSize) {
        // in general, try to get a hash table about 2x the input size
        chunkSize += chunkSize;
        // but no larger than max size:
        if (chunkSize >= MAX_HASH_SIZE) {
            return MAX_HASH_SIZE;
        }
        // otherwise just round up to the nearest power of two
        int hashLen = MIN_HASH_SIZE;
        while (hashLen < chunkSize) {
            hashLen += hashLen;
        }
        return hashLen;
    }

    private int first(byte[] in, int inPos) {
        return (in[inPos] << 8) + (in[inPos + 1] & 255);
    }

    /*
    private static int next(int v, byte[] in, int inPos) {
        return (v << 8) + (in[inPos + 2] & 255);
    }
     */

    private final int hash(int h) {
        // or 184117; but this seems to give better hashing?
        return ((h * 57321) >> 9) & _hashModulo;
        // original lzf-c.c used this:
        //return (((h ^ (h << 5)) >> (24 - HLOG) - h*5) & _hashModulo;
        // but that didn't seem to provide better matches
    }
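
    /* Note on the encoded form produced by tryCompress() below (the standard LZF
     * chunk body; the worked example is ours, derived from the arithmetic in the code):
     *  - literal run:  control byte 0..31 (= runLength - 1), followed by the literals
     *  - short match:  (matchLength - 2) in the top 3 bits (values 1..6), and
     *                  (distance - 1) in the low 13 bits, spread over two bytes
     *  - long match:   top 3 bits all set (7), an extra byte holding matchLength - 9,
     *                  then the low byte of (distance - 1)
     * For example, a 5-byte match at distance 10 gives len = 3, off = 9, so the two
     * bytes emitted are ((9 >> 8) + (3 << 5)) = 0x60 and (9 & 0xFF) = 0x09.
     */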

    private int tryCompress(byte[] in, int inPos, int inEnd, byte[] out, int outPos) {
        final int[] hashTable = _hashTable;
        ++outPos; // reserve a byte for the first literal-run control byte
        int hash = first(in, inPos); // seed hash from the first two bytes of this block
        int literals = 0;
        inEnd -= 4;
        final int firstPos = inPos; // so that we won't have back references across block boundary

        while (inPos < inEnd) {
            byte p2 = in[inPos + 2];
            // roll the hash forward so it covers in[inPos .. inPos + 2]
            hash = (hash << 8) + (p2 & 255);
            int off = hash(hash);
            int ref = hashTable[off];
            hashTable[off] = inPos;

            // First expected common case: no back-ref (for whatever reason)
            if (ref >= inPos // can't refer forward (i.e. leftovers)
                    || ref < firstPos // or to previous block
                    || (off = inPos - ref - 1) >= MAX_OFF
                    || in[ref + 2] != p2 // must match hash
                    || in[ref + 1] != (byte) (hash >> 8)
                    || in[ref] != (byte) (hash >> 16)) {
                out[outPos++] = in[inPos++];
                literals++;
                if (literals == LZFChunk.MAX_LITERAL) {
                    out[outPos - 33] = (byte) 31; // <= out[outPos - literals - 1] = MAX_LITERAL_MINUS_1;
                    literals = 0;
                    outPos++; // reserve the control byte for the next literal run
                }
                continue;
            }
            // match
            int maxLen = inEnd - inPos + 2;
            if (maxLen > MAX_REF) {
                maxLen = MAX_REF;
            }
            if (literals == 0) {
                outPos--; // no literal run pending; reclaim the reserved control byte
            } else {
                out[outPos - literals - 1] = (byte) (literals - 1);
                literals = 0;
            }
            int len = 3;
            while (len < maxLen && in[ref + len] == in[inPos + len]) {
                len++;
            }
            len -= 2;
            if (len < 7) {
                out[outPos++] = (byte) ((off >> 8) + (len << 5));
            } else {
                out[outPos++] = (byte) ((off >> 8) + (7 << 5));
                out[outPos++] = (byte) (len - 7);
            }
            out[outPos++] = (byte) off;
            outPos++; // reserve the control byte for the literal run that may follow
            inPos += len;
            // re-prime the hash over the last two bytes of the match, storing both positions
            hash = first(in, inPos);
            hash = (hash << 8) + (in[inPos + 2] & 255);
            hashTable[hash(hash)] = inPos++;
            hash = (hash << 8) + (in[inPos + 2] & 255);
            // hash = next(hash, in, inPos);
            hashTable[hash(hash)] = inPos++;
        }
        inEnd += 4;
        // try offlining the tail
        return tryCompressTail(in, inPos, inEnd, out, outPos, literals);
    }

    private int tryCompressTail(byte[] in, int inPos, int inEnd, byte[] out, int outPos,
                                int literals) {
        while (inPos < inEnd) {
            out[outPos++] = in[inPos++];
            literals++;
            if (literals == LZFChunk.MAX_LITERAL) {
                out[outPos - literals - 1] = (byte) (literals - 1);
                literals = 0;
                outPos++;
            }
        }
        out[outPos - literals - 1] = (byte) (literals - 1);
        if (literals == 0) {
            outPos--; // no trailing literals; drop the unused control byte
        }
        return outPos;
    }
}