/* * This program is free software; you can redistribute it and/or modify it under the * terms of the GNU Lesser General Public License, version 2.1 as published by the Free Software * Foundation. * * You should have received a copy of the GNU Lesser General Public License along with this * program; if not, you can obtain a copy at http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html * or from the Free Software Foundation, Inc., * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. * * This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; * without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. * See the GNU Lesser General Public License for more details. * * Copyright (c) 2001 - 2017 Object Refinery Ltd, Pentaho Corporation and Contributors.. All rights reserved. */ package org.pentaho.reporting.engine.classic.core.modules.output.table.html.util; import org.pentaho.reporting.libraries.xmlns.writer.CharacterEntityParser; import java.util.Properties; /** * A collection of all character entites defined in the HTML4 standard. The key is the entity name, the property value * is the decoded string. * * @author Thomas Morgner */ public class HtmlCharacterEntities extends Properties { /** * The singleton instance for this entity-parser implementation. */ private static CharacterEntityParser entityParser; /** * Gets the character entity parser for HTML content. The CharacterEntity parser translates known characters into * predefined entities. * * @return the character entity parser instance. */ public static synchronized CharacterEntityParser getEntityParser() { if ( entityParser == null ) { entityParser = new CharacterEntityParser( new HtmlCharacterEntities() ); } return entityParser; } private void addAccentedCharacters() { setProperty( "acute", "\u00b4" ); setProperty( "cedil", "\u00b8" ); setProperty( "circ", "\u02c6" ); setProperty( "macr", "\u00af" ); setProperty( "middot", "\u00b7" ); setProperty( "tilde", "\u02dc" ); setProperty( "uml", "\u00a8" ); setProperty( "Aacute", "\u00c1" ); setProperty( "aacute", "\u00e1" ); setProperty( "Acirc", "\u00c2" ); setProperty( "acirc", "\u00e2" ); setProperty( "AElig", "\u00c6" ); setProperty( "aelig", "\u00e6" ); setProperty( "Agrave", "\u00c0" ); setProperty( "agrave", "\u00e0" ); setProperty( "Aring", "\u00c5" ); setProperty( "aring", "\u00e5" ); setProperty( "atilde", "\u00e3" ); setProperty( "Atilde", "\u00c3" ); setProperty( "Auml", "\u00c4" ); setProperty( "auml", "\u00e4" ); setProperty( "ccedil", "\u00e7" ); setProperty( "Ccedil", "\u00c7" ); setProperty( "Eacute", "\u00c9" ); setProperty( "eacute", "\u00e9" ); setProperty( "Ecirc", "\u00ca" ); setProperty( "ecirc", "\u00ea" ); setProperty( "Egrave", "\u00c8" ); setProperty( "egrave", "\u00e8" ); setProperty( "ETH", "\u00d0" ); setProperty( "eth", "\u00f0" ); setProperty( "Euml", "\u00cb" ); setProperty( "euml", "\u00eb" ); setProperty( "Iacute", "\u00cd" ); setProperty( "iacute", "\u00ed" ); setProperty( "Icirc", "\u00ce" ); setProperty( "icirc", "\u00ee" ); setProperty( "Igrave", "\u00cc" ); setProperty( "igrave", "\u00ec" ); setProperty( "Iuml", "\u00cf" ); setProperty( "iuml", "\u00ef" ); setProperty( "Ntilde", "\u00d1" ); setProperty( "ntilde", "\u00f1" ); setProperty( "Oacute", "\u00d3" ); setProperty( "oacute", "\u00f3" ); setProperty( "Ocirc", "\u00d4" ); setProperty( "ocirc", "\u00f4" ); setProperty( "Oelig", "\u0152" ); setProperty( "oelig", "\u0153" ); setProperty( "Ograve", "\u00d2" ); setProperty( "ograve", "\u00f2" ); setProperty( "Oslash", "\u00d8" ); setProperty( "oslash", "\u00f8" ); setProperty( "Otilde", "\u00d5" ); setProperty( "otilde", "\u00f5" ); setProperty( "Ouml", "\u00d6" ); setProperty( "ouml", "\u00f6" ); setProperty( "Scaron", "\u0160" ); setProperty( "scaron", "\u0161" ); setProperty( "szlig", "\u00df" ); setProperty( "THORN", "\u00de" ); setProperty( "thorn", "\u00fe" ); setProperty( "Uacute", "\u00da" ); setProperty( "uacute", "\u00fa" ); setProperty( "Ucirc", "\u00db" ); setProperty( "ucirc", "\u00fb" ); setProperty( "Ugrave", "\u00d9" ); setProperty( "ugrave", "\u00f9" ); setProperty( "Uuml", "\u00dc" ); setProperty( "uuml", "\u00fc" ); setProperty( "Yacute", "\u00dd" ); setProperty( "yacute", "\u00fd" ); setProperty( "Yuml", "\u0178" ); setProperty( "yuml", "\u00ff" ); } /** * Creates an instance. * <p/> * Source: http://www.cookwood.com/html/extras/entities.html */ public HtmlCharacterEntities() { // Characters with special meaning setProperty( "amp", "\u0026" ); setProperty( "gt", "\u003e" ); setProperty( "lt", "\u003c" ); setProperty( "quot", "\"" ); // Entities for accented characters, accents, and other diacritics from Western European Languages addAccentedCharacters(); // Entities for punctuation characters addPunctuationCharacters(); // Entities for mathematical and technical characters (including Greek) addMathCharacters(); // Entities for shapes and arrows setProperty( "crarr", "\u21b5" ); setProperty( "darr", "\u2193" ); setProperty( "dArr", "\u21d3" ); setProperty( "harr", "\u2194" ); setProperty( "hArr", "\u21d4" ); setProperty( "larr", "\u2190" ); setProperty( "lArr", "\u21d0" ); setProperty( "rarr", "\u2192" ); setProperty( "rArr", "\u21d2" ); setProperty( "uarr", "\u2191" ); setProperty( "uArr", "\u21d1" ); setProperty( "clubs", "\u2663" ); setProperty( "diams", "\u2666" ); setProperty( "hearts", "\u2665" ); setProperty( "spades", "\u2660" ); setProperty( "loz", "\u25ca" ); setProperty( "rlm", "\u200f" ); setProperty( "prop", "\u221d" ); } private void addMathCharacters() { setProperty( "deg", "\u00b0" ); setProperty( "divide", "\u00f7" ); setProperty( "frac12", "\u00bd" ); setProperty( "frac14", "\u00bc" ); setProperty( "frac34", "\u00be" ); setProperty( "ge", "\u2265" ); setProperty( "le", "\u2264" ); setProperty( "minus", "\u2212" ); setProperty( "sup2", "\u00b2" ); setProperty( "sup3", "\u00b3" ); setProperty( "times", "\u00d7" ); setProperty( "alefsym", "\u2135" ); setProperty( "and", "\u2227" ); setProperty( "ang", "\u2220" ); setProperty( "asymp", "\u2248" ); setProperty( "cap", "\u2229" ); setProperty( "cong", "\u2245" ); setProperty( "cup", "\u222a" ); setProperty( "empty", "\u2205" ); setProperty( "equiv", "\u2261" ); setProperty( "exist", "\u2203" ); setProperty( "fnof", "\u0192" ); setProperty( "forall", "\u2200" ); setProperty( "infin", "\u221e" ); setProperty( "int", "\u222b" ); setProperty( "isin", "\u2208" ); setProperty( "lang", "\u2329" ); setProperty( "lceil", "\u2308" ); setProperty( "lfloor", "\u22a6" ); setProperty( "lowast", "\u2217" ); setProperty( "micro", "\u00b5" ); setProperty( "nabla", "\u2207" ); setProperty( "ne", "\u2260" ); setProperty( "ni", "\u220b" ); setProperty( "notin", "\u2209" ); setProperty( "nsub", "\u2284" ); setProperty( "oplus", "\u2295" ); setProperty( "or", "\u2228" ); setProperty( "otimes", "\u2297" ); setProperty( "part", "\u2202" ); setProperty( "perp", "\u22a5" ); setProperty( "plusmn", "\u00b1" ); setProperty( "prod", "\u220f" ); setProperty( "radic", "\u221a" ); setProperty( "rang", "\u232a" ); setProperty( "rceil", "\u2309" ); setProperty( "rfloor", "\u22a7" ); setProperty( "sdot", "\u22c5" ); setProperty( "sim", "\u223c" ); setProperty( "sub", "\u2282" ); setProperty( "sube", "\u2286" ); setProperty( "sum", "\u2211" ); setProperty( "sup", "\u2283" ); setProperty( "supe", "\u2287" ); setProperty( "there4", "\u2234" ); setProperty( "Alpha", "\u0391" ); setProperty( "alpha", "\u03b1" ); setProperty( "Beta", "\u0392" ); setProperty( "beta", "\u03b2" ); setProperty( "Chi", "\u03a7" ); setProperty( "chi", "\u03c7" ); setProperty( "Delta", "\u0394" ); setProperty( "delta", "\u03b4" ); setProperty( "Epsilon", "\u0395" ); setProperty( "epsilon", "\u03b5" ); setProperty( "Eta", "\u0397" ); setProperty( "eta", "\u03b7" ); setProperty( "Gamma", "\u0393" ); setProperty( "gamma", "\u03b3" ); setProperty( "Iota", "\u0399" ); setProperty( "iota", "\u03b9" ); setProperty( "Kappa", "\u039a" ); setProperty( "kappa", "\u03ba" ); setProperty( "Lambda", "\u039b" ); setProperty( "lambda", "\u03bb" ); setProperty( "Mu", "\u039c" ); setProperty( "mu", "\u03bc" ); setProperty( "Nu", "\u039d" ); setProperty( "nu", "\u03bd" ); setProperty( "Omega", "\u03a9" ); setProperty( "omega", "\u03c9" ); setProperty( "Omicron", "\u039f" ); setProperty( "omicron", "\u03bf" ); setProperty( "Phi", "\u03a6" ); setProperty( "phi", "\u03c6" ); setProperty( "Pi", "\u03a0" ); setProperty( "pi", "\u03c0" ); setProperty( "piv", "\u03d6" ); setProperty( "Psi", "\u03a8" ); setProperty( "psi", "\u03c8" ); setProperty( "Rho", "\u03a1" ); setProperty( "rho", "\u03c1" ); setProperty( "Sigma", "\u03a3" ); setProperty( "sigma", "\u03c3" ); setProperty( "sigmaf", "\u03c2" ); setProperty( "Tau", "\u03a4" ); setProperty( "tau", "\u03c4" ); setProperty( "Theta", "\u0398" ); setProperty( "theta", "\u03b8" ); setProperty( "thetasym", "\u03d1" ); setProperty( "upsih", "\u03d2" ); setProperty( "Upsilon", "\u03a5" ); setProperty( "upsilon", "\u03c5" ); setProperty( "Xi", "\u039e" ); setProperty( "xi", "\u03be" ); setProperty( "Zeta", "\u0396" ); setProperty( "zeta", "\u03b6" ); } private void addPunctuationCharacters() { setProperty( "cent", "\u00a2" ); setProperty( "curren", "\u00a4" ); setProperty( "euro", "\u20ac" ); setProperty( "pound", "\u00a3" ); setProperty( "yen", "\u00a5" ); setProperty( "brvbar", "\u00a6" ); setProperty( "bull", "\u2022" ); setProperty( "copy", "\u00a9" ); setProperty( "dagger", "\u2020" ); setProperty( "Dagger", "\u2021" ); setProperty( "frasl", "\u2044" ); setProperty( "hellip", "\u2026" ); setProperty( "iexcl", "\u00a1" ); setProperty( "image", "\u2111" ); setProperty( "iquest", "\u00bf" ); setProperty( "lrm", "\u200e" ); setProperty( "mdash", "\u2014" ); setProperty( "ndash", "\u2013" ); setProperty( "not", "\u00ac" ); setProperty( "oline", "\u203e" ); setProperty( "ordf", "\u00aa" ); setProperty( "ordm", "\u00ba" ); setProperty( "para", "\u00b6" ); setProperty( "permil", "\u2030" ); setProperty( "prime", "\u2032" ); setProperty( "Prime", "\u2033" ); setProperty( "real", "\u211c" ); setProperty( "reg", "\u00ae" ); setProperty( "rim", "\u8207" ); setProperty( "sect", "\u00a7" ); setProperty( "shy", "\u00ad" ); setProperty( "sup1", "\u00b9" ); setProperty( "trade", "\u2122" ); setProperty( "weierp", "\u2118" ); setProperty( "bdquo", "\u201e" ); setProperty( "laquo", "\u00ab" ); setProperty( "ldquo", "\u201c" ); setProperty( "lsaquo", "\u2039" ); setProperty( "lsquo", "\u2018" ); setProperty( "raquo", "\u00bb" ); setProperty( "rdquo", "\u201d" ); setProperty( "rsaquo", "\u203a" ); setProperty( "rsquo", "\u2019" ); setProperty( "sbquo", "\u201a" ); setProperty( "emsp", "\u2003" ); setProperty( "ensp", "\u2002" ); setProperty( "nbsp", "\u00a0" ); setProperty( "thinsp", "\u2009" ); setProperty( "zwj", "\u200d" ); setProperty( "zwnj", "\u200c" ); } }