PDFFontEncoding.java example

Explorer

PDFrenderer-master
- src
  - com
    - sun
      - pdfview
        BaseWatchable.java
        ByteBufferInputStream.java
        Cache.java
        Configuration.java
        HexDump.java
        Identity8BitCharsetEncoder.java
        ImageInfo.java
        NameTree.java
        OutlineNode.java
        PDFCmd.java
        PDFDebugger.java
        PDFDestination.java
        PDFDocCharsetEncoder.java
        PDFErrorHandler.java
        PDFFile.java
        PDFImage.java
        PDFImageParseException.java
        PDFObject.java
        PDFPage.java
        PDFPaint.java
        PDFParseException.java
        PDFParser.java
        PDFRenderer.java
        PDFShapeCmd.java
        PDFStringUtil.java
        PDFTextFormat.java
        PDFXref.java
        PdfSubByteSampleModel.java
        RefImage.java
        Watchable.java
        action
        GoToAction.java
        GoToEAction.java
        GoToRAction.java
        LaunchAction.java
        PDFAction.java
        PdfObjectParseUtil.java
        UriAction.java
        annotation
        FreetextAnnotation.java
        LinkAnnotation.java
        PDFAnnotation.java
        StampAnnotation.java
        WidgetAnnotation.java
        colorspace
        AltColorSpace.java
        AlternateColorSpace.java
        CMYKColorSpace.java
        CalGrayColor.java
        CalRGBColor.java
        IndexedColor.java
        LabColor.java
        MaskColorSpace.java
        PDFColorSpace.java
        PatternSpace.java
        YCCKColorSpace.java
        decode
        ASCII85Decode.java
        ASCIIHexDecode.java
        CCITTFaxDecode.java
        CCITTFaxDecoder.java
        DCTDecode.java
        FlateDecode.java
        ImageDataDecoder.java
        JBig2Decode.java
        JPXDecode.java
        LZWDecode.java
        PDFDecoder.java
        PNGPredictor.java
        Predictor.java
        RunLengthDecode.java
        TIFFPredictor.java
        decrypt
        CryptFilterDecrypter.java
        EncryptionUnsupportedByPlatformException.java
        EncryptionUnsupportedByProductException.java
        IdentityDecrypter.java
        PDFAuthenticationFailureException.java
        PDFDecrypter.java
        PDFDecrypterFactory.java
        PDFPassword.java
        StandardDecrypter.java
        UnsupportedEncryptionException.java
        font
        BuiltinFont.java
        CIDFontType0.java
        CIDFontType2.java
        FlPoint.java
        FontSupport.java
        NativeFont.java
        OutlineFont.java
        PDFFont.java
        PDFFontDescriptor.java
        PDFFontEncoding.java
        PDFGlyph.java
        TTFFont.java
        Type0Font.java
        Type1CFont.java
        Type1Font.java
        Type3Font.java
        cid
        PDFCMap.java
        ToUnicodeMap.java
        ttf
        AdobeGlyphList.java
        CMap.java
        CMapFormat0.java
        CMapFormat4.java
        CMapFormat6.java
        CmapTable.java
        Glyf.java
        GlyfCompound.java
        GlyfSimple.java
        GlyfTable.java
        HeadTable.java
        HheaTable.java
        HmtxTable.java
        LocaTable.java
        MaxpTable.java
        NameTable.java
        PostTable.java
        TrueTypeFont.java
        TrueTypeTable.java
        function
        FunctionType0.java
        FunctionType2.java
        FunctionType3.java
        FunctionType4.java
        PDFFunction.java
        postscript
        PostScriptParser.java
        operation
        Abs.java
        Add.java
        And.java
        Atan.java
        Bitshift.java
        Ceiling.java
        Copy.java
        Cvi.java
        Cvr.java
        Div.java
        Dup.java
        Eq.java
        Exch.java
        Exp.java
        Expression.java
        False.java
        Floor.java
        Ge.java
        Gt.java
        Idiv.java
        If.java
        IfElse.java
        Index.java
        Le.java
        Ln.java
        Log.java
        Lt.java
        Mod.java
        Mul.java
        Ne.java
        Neg.java
        Not.java
        OperationSet.java
        Or.java
        Pop.java
        PostScriptOperation.java
        PushAsNumber.java
        Roll.java
        Round.java
        Sin.java
        Sqrt.java
        Sub.java
        True.java
        Truncate.java
        Xor.java
        pattern
        DummyShader.java
        PDFPattern.java
        PDFShader.java
        PatternType1.java
        PatternType2.java
        ShaderType2.java
        ShaderType3.java
- test
  - src
    - com
      - sun
        pdfview
        function
        postscript
        PostScriptOPTest.java

/*
 * Copyright 2004 Sun Microsystems, Inc., 4150 Network Circle,
 * Santa Clara, California 95054, U.S.A. All rights reserved.
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 * 
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 * 
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 */
package com.sun.pdfview.font;

import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;

import com.sun.pdfview.PDFObject;
import com.sun.pdfview.font.cid.PDFCMap;

/**
 * The PDFFont encoding encapsulates the mapping from character codes
 * in the PDF document to glyphs of the font.
 *
 * Encodings take two basic forms.  For Type1, TrueType, and Type3 fonts,
 * the encoding maps from character codes to Strings, which represent the
 * glyphs of the font.  For Type0 fonts, the mapping is a CMap which maps
 * character codes to characters in one of many descendant fonts.
 *
 * Note that the data in the PDF might be ASCII characters (bytes) or it might
 * be a multi-byte format such as Unicode.  For now we will assume all
 * glyph ids fit into at most the two bytes of a character.
 */
public class PDFFontEncoding {

    /** Encoding type: character codes map to glyph names */
    private static final int TYPE_ENCODING = 0;
    /** Encoding type: character codes are mapped through a CMap */
    private static final int TYPE_CMAP = 1;
    /**
     * the base encoding (an array of integers which can be mapped to names
     * using the methods on FontSupport)
     */
    private int[] baseEncoding;
    /** any differences from the base encoding, keyed by character code */
    private Map<Character,String> differences;
    /**
     * a CMap for fonts encoded by CMap
     */
    private PDFCMap cmap;
    /**
     * the type of this encoding (TYPE_ENCODING or TYPE_CMAP)
     */
    private int type;

    /**
     * Creates a CMap-based encoding from an already constructed CMap.
     *
     * @param cmap the CMap used to translate character codes
     */
    public PDFFontEncoding(PDFCMap cmap) {
        super();
        this.type = TYPE_CMAP;
        this.cmap = cmap;
    }

    /**
     * Creates a new instance of PDFFontEncoding from the font's encoding
     * object.
     *
     * @param fontType the font subtype; "Type0" selects CMap handling when
     *        the encoding is given by name (or carries no "Type" entry)
     * @param encoding either a name (a predefined encoding or CMap) or an
     *        object with dictionary entries describing an encoding or CMap
     * @throws IOException if reading the encoding object fails
     * @throws IllegalArgumentException if the encoding name or the "Type"
     *         entry is not one this class understands
     */
    public PDFFontEncoding(String fontType, PDFObject encoding)
            throws IOException {
        // constant-first comparison so that a null fontType is tolerated
        boolean isType0 = "Type0".equals(fontType);

        if (encoding.getType() == PDFObject.NAME) {
            // if the encoding is a String, it is the name of an encoding
            // or the name of a CMap, depending on the type of the font
            if (isType0) {
                this.type = TYPE_CMAP;
                this.cmap = PDFCMap.getCMap(encoding.getStringValue());
            } else {
                this.type = TYPE_ENCODING;

                this.differences = new HashMap<Character,String>();
                this.baseEncoding = this.getBaseEncoding(encoding.getStringValue());
            }
        } else {
            // look at the "Type" entry of the encoding to determine the type
            PDFObject typeObj = encoding.getDictRef("Type");
            String typeStr;
            if (typeObj != null) {
                typeStr = typeObj.getStringValue();
            } else {
                // "Type" is optional in an encoding dictionary, so its
                // absence must not be fatal.  Fall back on the font type:
                // Type0 fonts are encoded by CMap, everything else by an
                // encoding dictionary.
                typeStr = isType0 ? "CMap" : "Encoding";
            }

            if ("Encoding".equals(typeStr)) {
                // it is an encoding
                this.type = TYPE_ENCODING;
                parseEncoding(encoding);
            } else if ("CMap".equals(typeStr)) {
                // it is a CMap
                this.type = TYPE_CMAP;
                this.cmap = PDFCMap.getCMap(encoding);
            } else {
                // report the offending value, not the (still unset) type field
                throw new IllegalArgumentException("Unknown encoding type: " + typeStr);
            }
        }
    }

    /**
     * Get the glyphs associated with a given String.
     *
     * For a plain encoding every char of the text yields one glyph.  For a
     * CMap two consecutive chars (low byte of each) are combined into one
     * 16-bit code; a trailing unpaired char supplies the high byte only.
     *
     * @param font the font to fetch glyphs from
     * @param text the raw text, one char per byte of the PDF string
     * @return the glyphs in text order
     */
    public List<PDFGlyph> getGlyphs(PDFFont font, String text) {
        List<PDFGlyph> outList = new ArrayList<PDFGlyph>(text.length());

        // go character by character through the text
        char[] arry = text.toCharArray();
        for (int i = 0; i < arry.length; i++) {
            switch (this.type) {
                case TYPE_ENCODING:
                    outList.add(getGlyphFromEncoding(font, arry[i]));
                    break;
                case TYPE_CMAP:
                    // 2 bytes -> 1 character in a CMap
                    char c = (char) ((arry[i] & 0xff) << 8);
                    if (i < arry.length - 1) {
                        // consume the following char as the low byte
                        c |= (char) (arry[++i] & 0xff);
                    }
                    outList.add(getGlyphFromCMap(font, c));
                    break;
            }
        }

        return outList;
    }

    /**
     * Get a glyph from an encoding, given a font and character.
     *
     * The glyph name is taken from the differences map when it has an entry
     * for the code, otherwise from the base encoding (if any).  The name may
     * end up null, in which case the font is asked with a null name.
     */
    private PDFGlyph getGlyphFromEncoding(PDFFont font, char src) {
        String charName = null;

        // only deal with one byte of source
        src &= 0xff;

        // see if this character is in the differences list
        Character key = Character.valueOf(src);
        if (this.differences.containsKey(key)) {
            charName = this.differences.get(key);
        } else if (this.baseEncoding != null && src < this.baseEncoding.length) {
            // get the character name from the base encoding; the length
            // check guards against tables with fewer than 256 entries
            int charID = this.baseEncoding[src];
            charName = FontSupport.getName(charID);
        }

        return font.getCachedGlyph(src, charName);
    }

    /**
     * Get a glyph from a CMap, given a Type0 font and a character.
     *
     * The CMap supplies both the descendant font id and the mapped character
     * code; when the font is a Type0Font the glyph is fetched from that
     * descendant font, otherwise from the font itself.
     */
    private PDFGlyph getGlyphFromCMap(PDFFont font, char src) {
        int fontID = this.cmap.getFontID(src);
        char charID = this.cmap.map(src);

        if (font instanceof Type0Font) {
            font = ((Type0Font) font).getDescendantFont(fontID);
        }

        return font.getCachedGlyph(charID, null);
    }

    /**
     * Parse a PDF encoding object for the actual encoding.
     *
     * Reads the optional "BaseEncoding" name and the optional "Differences"
     * array.  In the differences array a number sets the current code and
     * each following name is assigned to the current code, which is then
     * incremented.  Any previously parsed differences are discarded.
     *
     * @param encoding the encoding dictionary object
     * @throws IOException if reading the encoding object fails
     * @throws IllegalArgumentException if the base encoding name is unknown
     *         or the differences array holds something other than numbers
     *         and names
     */
    public void parseEncoding(PDFObject encoding) throws IOException {
        this.differences = new HashMap<Character,String>();

        // figure out the base encoding, if one exists
        PDFObject baseEncObj = encoding.getDictRef("BaseEncoding");
        if (baseEncObj != null) {
            this.baseEncoding = getBaseEncoding(baseEncObj.getStringValue());
        }

        // parse the differences array
        PDFObject diffArrayObj = encoding.getDictRef("Differences");
        if (diffArrayObj != null) {
            PDFObject[] diffArray = diffArrayObj.getArray();
            int curPosition = -1;

            for (int i = 0; i < diffArray.length; i++) {
                PDFObject entry = diffArray[i];
                if (entry.getType() == PDFObject.NUMBER) {
                    // a number restarts the run at the given code
                    curPosition = entry.getIntValue();
                } else if (entry.getType() == PDFObject.NAME) {
                    Character key = Character.valueOf((char) curPosition);
                    this.differences.put(key, entry.getStringValue());
                    curPosition++;
                } else {
                    throw new IllegalArgumentException("Unexpected type in diff array: " + entry);
                }
            }
        }
    }

    /**
     * Get the base encoding for a given name.
     *
     * @param encodingName one of the predefined encoding names
     * @return the matching table from FontSupport
     * @throws IllegalArgumentException if the name is not recognized
     */
    private int[] getBaseEncoding(String encodingName) {
        if (encodingName.equals("MacRomanEncoding")) {
            return FontSupport.macRomanEncoding;
        } else if (encodingName.equals("MacExpertEncoding")) {
            return FontSupport.type1CExpertCharset;
        } else if (encodingName.equals("WinAnsiEncoding")) {
            return FontSupport.winAnsiEncoding;
        } else if (encodingName.equals("StandardEncoding")) {
            return FontSupport.standardEncoding;
        } else if (encodingName.equals("SymbolSetEncoding")) {
            return FontSupport.symbolSetEncoding;
        } else {
            throw new IllegalArgumentException("Unknown encoding: " + encodingName);
        }
    }
}