package org.jabref.logic.formatter.bibtexfields;

import java.util.Objects;
import java.util.regex.Pattern;

import org.jabref.logic.l10n.Localization;
import org.jabref.logic.layout.LayoutFormatter;
import org.jabref.model.cleanup.Formatter;

import org.apache.commons.lang3.StringEscapeUtils;

/**
 * Formatter that turns HTML-flavoured text into plain Unicode text: HTML character
 * entities are unescaped and anything that looks like a tag is removed.
 */
public class HtmlToUnicodeFormatter implements LayoutFormatter, Formatter {

    /** Matches anything of the form {@code <...>}; compiled once instead of on every call. */
    private static final Pattern HTML_TAG = Pattern.compile("<[^>]*>");

    @Override
    public String getName() {
        return "HTML to Unicode";
    }

    @Override
    public String getKey() {
        return "html_to_unicode";
    }

    @Override
    public String getDescription() {
        return Localization.lang("Converts HTML code to Unicode.");
    }

    @Override
    public String getExampleInput() {
        return "<b>bread</b> & butter";
    }

    /**
     * Unescapes the HTML entities in the given text and then removes every
     * {@code <...>} sequence from the result.
     *
     * <p>Entities are unescaped before tags are removed, so the tag pattern is
     * applied to the already unescaped text.
     *
     * @param fieldText the text to convert; must not be {@code null}
     * @return the text with entities unescaped and tags removed
     * @throws NullPointerException if {@code fieldText} is {@code null}
     */
    @Override
    public String format(String fieldText) {
        // Fail with a clear message rather than an incidental NPE further down.
        Objects.requireNonNull(fieldText, "fieldText must not be null");

        // StringEscapeUtils converts characters and the regex kills tags
        String unescaped = StringEscapeUtils.unescapeHtml4(fieldText);
        return HTML_TAG.matcher(unescaped).replaceAll("");
    }
}