UnicodeDetector.java example

Explorer

common_utils-master
- baidu_api
  - src
    - main
      - java
        com
        xiongyingqi
        utils
        baidu
        CommonUtil.java
        ip
        IpAddress.java
        vo
        ContentVo.java
        IpAddressVo.java
        Status.java
        map
        AddressMatcher.java
    - test
      - java
        com
        xiongyingqi
        utils
        baidu
        IpAddressTest.java
- common_code
  - src
    - main
      - java
        com
        xiongyingqi
        utils
        code
        CodeAnnotation.java
        CodeBuilder.java
        CodeCondition.java
        CodeHelper.java
        CodeProcessor.java
    - test
      - java
        com
        xiongyingqi
        utils
        code
        CodeBuilderTest.java
- common_helper
  - src
    - main
      - java
        com
        xiongyingqi
        calendar
        CalendarBuilder.java
        captcha
        background
        BackgroundFactory.java
        SingleColorBackgroundFactory.java
        color
        ColorFactory.java
        GradientColorFactory.java
        RandomColorFactory.java
        SingleColorFactory.java
        filter
        AbstractFilterFactory.java
        ConfigurableFilterFactory.java
        FilterFactory.java
        library
        AbstractConvolveImageOp.java
        AbstractImageOp.java
        AbstractTransformImageOp.java
        BlurImageOp.java
        CurvesImageOp.java
        DiffuseImageOp.java
        DoubleRippleImageOp.java
        MarbleImageOp.java
        PerlinNoise.java
        RippleImageOp.java
        SoftenImageOp.java
        WobbleImageOp.java
        predefined
        CurvesRippleFilterFactory.java
        DiffuseRippleFilterFactory.java
        DoubleRippleFilterFactory.java
        MarbleRippleFilterFactory.java
        RippleFilterFactory.java
        WobbleRippleFilterFactory.java
        font
        FontFactory.java
        RandomFontFactory.java
        service
        AbstractCaptchaService.java
        Captcha.java
        CaptchaService.java
        ConfigurableCaptchaService.java
        SimpleCaptchaService.java
        text
        renderer
        AbstractTextRenderer.java
        BestFitTextRenderer.java
        RandomYBestFitTextRenderer.java
        SimpleTextRenderer.java
        TextCharacter.java
        TextRenderer.java
        TextString.java
        utils
        encoder
        EncoderHelper.java
        word
        AdaptiveRandomWordFactory.java
        RandomWordFactory.java
        WordFactory.java
        jackson
        FilterPropertyHandler.java
        annotation
        AllowProperty.java
        IgnoreProperties.java
        IgnoreProperty.java
        helper
        ThreadJacksonMixInHolder.java
        impl
        Jackson1JavassistFilterPropertyHandler.java
        JavassistFilterPropertyHandler.java
        JavassistTest.java
        util
        AlternativeJdkIdGenerator.java
        AnnotationHelper.java
        AntPathMatcher.java
        AopTargetUtils.java
        Assert.java
        AutoPopulatingList.java
        Base64.java
        ByteHelper.java
        CRCHelper.java
        CalendarHelper.java
        ClassHelper.java
        ClassLookupHelper.java
        ClassUtils.java
        ClipBoardHelper.java
        CollectionHelper.java
        CollectionUtils.java
        CommonsLogWriter.java
        ComparatorHelper.java
        CompositeIterator.java
        ConcurrencyThrottleSupport.java
        ConcurrentReferenceHashMap.java
        ConsoleHelper.java
        CosineSimilarAlgorithm.java
        CustomizableThreadCreator.java
        DateHelper.java
        DefaultPropertiesPersister.java
        DigestUtils.java
        DomainHelper.java
        DynamicPassword.java
        EPlatform.java
        EntityHelper.java
        ErrorHandler.java
        FileCopyUtils.java
        FileHelper.java
        FileSystemUtils.java
        FileType.java
        GenericHelper.java
        GetDocumentPathDemo.java
        IdGenerator.java
        IdentityCardHelper.java
        InvalidMimeTypeException.java
        JsonHelper.java
        Judgment.java
        KeyObject.java
        KingrayResource.java
        LinkedCaseInsensitiveMap.java
        LinkedMultiValueMap.java
        Log4jConfigurer.java
        MD5Crypt.java
        MD5Helper.java
        MessageEncryptionHelper.java
        MethodInvoker.java
        MimeType.java
        MimeTypeUtils.java
        MultiValueMap.java
        MyClassLoader.java
        NumberHelper.java
        NumberUtils.java
        ObjectUtils.java
        PackageUtil.java
        PathMatcher.java
        PatternMatchUtils.java
        PhoneNumberAddress.java
        PrintHelper.java
        PropertiesHelper.java
        PropertiesPersister.java
        PropertyPlaceholderHelper.java
        ReflectHelper.java
        ReflectionUtils.java
        RegexHelper.java
        ResourceUtils.java
        RsaUtils.java
        SerializationUtils.java
        SerializeHelper.java
        ServletHelper.java
        SocketUtils.java
        StackTraceHelper.java
        StopWatch.java
        StreamUtils.java
        StringHelper.java
        StringUtil.java
        StringUtils.java
        StringValueResolver.java
        SystemPropertyUtils.java
        Test.java
        ThreadHelper.java
        ThreadPool.java
        ThreadPoolException.java
        TimerHelper.java
        TypeUtils.java
        UnicodeHelper.java
        WeakReferenceMonitor.java
        WinRegisterDemo.java
        WindowsHelper.java
        comparator
        BooleanComparator.java
        ComparableComparator.java
        CompoundComparator.java
        InstanceComparator.java
        InvertibleComparator.java
        NullSafeComparator.java
        StringComparator.java
        package-info.java
        concurrent
        FutureAdapter.java
        ListenableFuture.java
        ListenableFutureAdapter.java
        ListenableFutureCallback.java
        ListenableFutureCallbackRegistry.java
        ListenableFutureTask.java
        package-info.java
        package-info.java
        xml
        AbstractStaxContentHandler.java
        AbstractStaxXMLReader.java
        AbstractXMLReader.java
        AbstractXMLStreamReader.java
        DomContentHandler.java
        DomUtils.java
        SimpleNamespaceContext.java
        SimpleSaxErrorHandler.java
        SimpleTransformErrorListener.java
        StaxEventContentHandler.java
        StaxEventXMLReader.java
        StaxResult.java
        StaxSource.java
        StaxStreamContentHandler.java
        StaxStreamXMLReader.java
        StaxUtils.java
        TransformerUtils.java
        XMLEventStreamReader.java
        XMLEventStreamWriter.java
        XmlValidationModeDetector.java
        package-info.java
    - test
      - java
        AtomicTest.java
        LinkList.java
        LongTest.java
        UserAuthentication.java
        com
        xiongyingqi
        calendar
        CalendarBuilderTest.java
        jackson
        JsonFilterPropertyTest.java
        pojo
        Group.java
        User.java
        util
        AbstractImplements.java
        ClassHelperTest.java
        ConsoleHelperTest.java
        DateHelperTest.java
        EntityHelperTest.java
        FileHelperTest.java
        KeyObjectTest.java
        PrintHelperTest.java
        PropertiesHelperTest.java
        SubClass.java
        TestInterface.java
- common_http
  - src
    - main
      - java
        com
        xiongyingqi
        http
        BuildNameValuePairsHelper.java
        HttpAccess.java
        HttpBuilder.java
    - test
      - java
        Stock.java
- common_log
  - src
    - main
      - java
        com
        xiongyingqi
        Logger.java
  - test
    - java
      - com
        xiongyingqi
        LoggerTest.java
- common_thread
  - src
    - main
      - java
        com
        xiongyingqi
        utils
        thead
        ThreadPool.java
        ThreadPoolException.java
- commons-file
  - src
    - main
      - java
        com
        xiongyingqi
        util
        FileEncode.java
        cpdetector
        io
        parser
        EncodingLexer.java
        EncodingParser.java
        EncodingParserTokenTypes.java
        info
        monitorenter
        cpdetector
        ACmdLineArgsInheritor.java
        CharsetPrinter.java
        CodepageProcessor.java
        io
        ASCIIDetector.java
        AbstractCodepageDetector.java
        ByteOrderMarkDetector.java
        ClassFileFilterIsA.java
        CodepageDetectorProxy.java
        FileFilterExtensions.java
        HTMLCodepageDetector.java
        IClassFileFilter.java
        ICodepageDetector.java
        InputStreamDebug.java
        JChardetFacade.java
        JarArchive.java
        ParsingDetector.java
        UnicodeDetector.java
        UnknownCharset.java
        UnsupportedCharset.java
        parser
        EncodingLexer.java
        EncodingParser.java
        EncodingParserTokenTypes.java
        reflect
        SingletonLoader.java
        test
        ui
        ClassFileChooser.java
        FitAuthoringClient.java
        util
        collections
        ITreeNode.java
        TreeNodeUniqueChildren.java
        ui
        ITableRenderer.java
        StreamTableRenderer.java
        TableRendererHTML.java
        io
        LimitedInputStream.java
        MultiplexingOutputStream.java
        util
        Entry.java
        ExceptionUtil.java
        FileUtil.java
        StringUtil.java
        jargs
        gnu
        CmdLineParser.java
    - test
      - java
        FileHelperTest.java
- commons-ip
  - src
    - main
      - java
        com
        xiongyingqi
        ip
        IpHelper.java
        vo
        IpVo.java
- commons-logic
  - src
    - main
      - java
        com
        xiongyingqi
        logic
        ConditionalOperation.java
        action
        Action.java
        condition
        And.java
        Condition.java
        Logic.java
        Not.java
        Or.java
    - test
      - java
        com
        xiongyingqi
        logic
        ConditionalOperationTest.java
- commons-scan
  - src
    - main
      - java
        com
        xiongyingqi
        util
        ClassLookupHelper.java
        MethodScanner.java
        PackageScanner.java
    - test
      - java
        com
        xiongyingqi
        util
        AbstractImplements.java
        PackageScannerTest.java
        SubClass.java
        TestInterface.java
- commons-spring
  - src
    - main
      - java
        com
        xiongyingqi
        util
        SpringMVCHelper.java
- qrcode
  - src
    - main
      - java
        com
        xiongyingqi
        qrcode
        Profile.java
        QRCode.java
        QRCodeGenerator.java
    - test
      - java
        com
        xiongyingqi
        qrcode
        QRCodeGeneratorTest.java
        QRCodeTest.java
- spring-email
  - src
    - main
      - java
        com
        xiongyingqi
        email
        JavaMailSenderFactory.java
        service
        IEmailService.java
        impl
        EmailService.java
        vo
        AttachmentVo.java
        EmailAccount.java
        EmailVo.java
        InlineImageVo.java
    - test
      - java
        EmailBaseTest.java
        EmailServiceTest.java

/*
 * UnicodeDetector, detects Unicode encodings from a leading byte order mark (BOM).
 * Copyright (C) 2005  Achim Westermann, Achim.Westermann@gmx.de
 *
 * ***** BEGIN LICENSE BLOCK *****
 * Version: MPL 1.1/GPL 2.0/LGPL 2.1
 * 
 * The contents of this collection are subject to the Mozilla Public License Version 
 * 1.1 (the "License"); you may not use this file except in compliance with 
 * the License. You may obtain a copy of the License at 
 * http://www.mozilla.org/MPL/
 * 
 * Software distributed under the License is distributed on an "AS IS" basis,
 * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
 * for the specific language governing rights and limitations under the
 * License.
 * 
 * The Original Code is the cpDetector code in [sub] packages info.monitorenter and 
 * cpdetector. 
 * 
 * The Initial Developer of the Original Code is
 * Achim Westermann <achim.westermann@gmx.de>.
 * 
 * Portions created by the Initial Developer are Copyright (c) 2007 
 * the Initial Developer. All Rights Reserved.
 * 
 * Contributor(s):
 * 
 * Alternatively, the contents of this file may be used under the terms of
 * either the GNU General Public License Version 2 or later (the "GPL"), or
 * the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
 * in which case the provisions of the GPL or the LGPL are applicable instead
 * of those above. If you wish to allow use of your version of this file only
 * under the terms of either the GPL or the LGPL, and not to allow others to
 * use your version of this file under the terms of the MPL, indicate your
 * decision by deleting the provisions above and replace them with the notice
 * and other provisions required by the GPL or the LGPL. If you do not delete
 * the provisions above, a recipient may use your version of this file under
 * the terms of any one of the MPL, the GPL or the LGPL.
 * 
 * ***** END LICENSE BLOCK ***** * 
 *  
 * If you modify or optimize the code in a useful way please let me know.
 * Achim.Westermann@gmx.de
 */
package info.monitorenter.cpdetector.io;

import info.monitorenter.cpdetector.io.AbstractCodepageDetector;
import info.monitorenter.cpdetector.io.ICodepageDetector;
import info.monitorenter.cpdetector.io.UnknownCharset;

import java.io.BufferedInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.net.URL;
import java.nio.charset.Charset;


/**
 * Codepage detector that recognizes Unicode encodings solely by the byte order mark (BOM) at
 * the very beginning of the input.
 * <p>
 * Recognized signatures: UTF-32BE, UTF-32LE, UTF-8, UTF-16LE and UTF-16BE. Input without one of
 * these signatures yields {@link UnknownCharset}.
 * <p>
 * The class is a singleton; obtain the shared instance through {@link #getInstance()}.
 */
public class UnicodeDetector extends AbstractCodepageDetector {
    /** Number of leading bytes inspected; the longest signature handled here is four bytes. */
    private static final int MAX_BOM_LENGTH = 4;

    private static final byte[] BOM_UTF_32BE = {(byte)0x00, (byte)0x00, (byte)0xFE, (byte)0xFF};

    private static final byte[] BOM_UTF_32LE = {(byte)0xFF, (byte)0xFE, (byte)0x00, (byte)0x00};

    private static final byte[] BOM_UTF_8 = {(byte)0xEF, (byte)0xBB, (byte)0xBF};

    private static final byte[] BOM_UTF_16LE = {(byte)0xFF, (byte)0xFE};

    private static final byte[] BOM_UTF_16BE = {(byte)0xFE, (byte)0xFF};

    /** Lazily created shared instance; creation in {@link #getInstance()} is not synchronized. */
    private static ICodepageDetector instance;

    /**
     * Singleton constructor
     */
    private UnicodeDetector() {
        super();
    }

    /**
     * Returns the shared detector instance, creating it on first use.
     *
     * @return the singleton instance of this detector.
     */
    public static ICodepageDetector getInstance() {
        if (instance == null) {
            instance = new UnicodeDetector();
        }
        return instance;
    }

    /**
     * Detects a Unicode encoding from the byte order mark at the current position of the stream.
     * <p>
     * It is assumed that the input stream is at the start of the file or String (in order to
     * read the BOM). Up to four bytes are consumed from the stream and are not pushed back.
     *
     * @param in
     *            the stream to inspect, positioned at the first byte of the content.
     * @param length
     *            not consulted by this detector; at most four bytes are read regardless.
     * @return the charset matching the BOM, or {@link UnknownCharset#getInstance()} if the
     *         available leading bytes match none of the known signatures.
     * @throws IOException
     *             if reading from the stream fails.
     * @see info.monitorenter.cpdetector.io.ICodepageDetector#detectCodepage(java.io.InputStream, int)
     */
    public Charset detectCodepage(InputStream in, int length) throws IOException {
        byte[] bom = new byte[MAX_BOM_LENGTH];
        // A single read() may deliver fewer bytes than requested, so keep reading until the
        // buffer is full or the stream ends. Track how many bytes are real so that the zero
        // padding of a short stream is never mistaken for part of a signature.
        int available = 0;
        while (available < MAX_BOM_LENGTH) {
            int count = in.read(bom, available, MAX_BOM_LENGTH - available);
            if (count <= 0) {
                break;
            }
            available += count;
        }

        // The four-byte UTF-32 signatures must be tested before UTF-16: the UTF-32LE BOM
        // (FF FE 00 00) starts with the UTF-16LE BOM (FF FE).
        // UCS-4 big-endian uses the same signature as UTF-32BE and is reported as UTF-32BE.
        if (startsWith(bom, available, BOM_UTF_32BE)) {
            return Charset.forName("UTF-32BE");
        }
        if (startsWith(bom, available, BOM_UTF_32LE)) {
            return Charset.forName("UTF-32LE");
        }
        if (startsWith(bom, available, BOM_UTF_8)) {
            return Charset.forName("UTF-8");
        }
        if (startsWith(bom, available, BOM_UTF_16LE)) {
            return Charset.forName("UTF-16LE");
        }
        if (startsWith(bom, available, BOM_UTF_16BE)) {
            return Charset.forName("UTF-16BE");
        }
        return UnknownCharset.getInstance();
    }

    /**
     * Opens the given URL and detects the encoding from the BOM at the start of its content.
     * The stream is closed before returning, also when detection fails with an exception.
     *
     * @param url
     *            the location of the document to inspect.
     * @return the detected charset, see {@link #detectCodepage(InputStream, int)}.
     * @throws IOException
     *             if the URL cannot be opened or read.
     * @see info.monitorenter.cpdetector.io.ICodepageDetector#detectCodepage(java.net.URL)
     */
    public Charset detectCodepage(final URL url) throws IOException {
        BufferedInputStream in = new BufferedInputStream(url.openStream());
        try {
            return this.detectCodepage(in, Integer.MAX_VALUE);
        } finally {
            in.close();
        }
    }

    /**
     * Tells whether the first {@code available} bytes of {@code data} begin with
     * {@code signature}.
     */
    private static boolean startsWith(byte[] data, int available, byte[] signature) {
        if (available < signature.length) {
            return false;
        }
        for (int i = 0; i < signature.length; i++) {
            if (data[i] != signature[i]) {
                return false;
            }
        }
        return true;
    }

}