//Dstl (c) Crown Copyright 2017
package uk.gov.dstl.baleen.contentmappers;
import org.apache.uima.jcas.JCas;
import org.jsoup.nodes.Element;
import com.google.common.base.Strings;
import uk.gov.dstl.baleen.contentmappers.helpers.AnnotationCollector;
import uk.gov.dstl.baleen.contentmappers.helpers.ContentMapper;
import uk.gov.dstl.baleen.types.metadata.Metadata;
/**
 * Convert from meta tags into a Metadata annotation, retaining the key (name) and value (content or
 * charset) attributes.
 *
 * <p>The value is taken from the {@code content} attribute when it is non-empty, otherwise from the
 * {@code charset} attribute. Tags of the form {@code <meta charset="...">} carry no {@code name}
 * attribute, so in that case the key is set to {@code "charset"} rather than being left empty.
 */
public class MetaTags implements ContentMapper {

  /** Key used for charset declarations that have no {@code name} attribute of their own. */
  private static final String CHARSET_KEY = "charset";

  /**
   * Create a Metadata annotation for a {@code meta} element and add it to the collector.
   *
   * <p>Elements with any other tag name are ignored. A Metadata annotation is added for every
   * {@code meta} element, even if neither {@code content} nor {@code charset} is present (the value
   * is then left unset).
   *
   * @param jCas the JCas in which the Metadata annotation is created
   * @param element the HTML element being mapped
   * @param collector receives the created annotation
   */
  @Override
  public void map(JCas jCas, Element element, AnnotationCollector collector) {
    if (!"meta".equalsIgnoreCase(element.tagName())) {
      return;
    }

    Metadata md = new Metadata(jCas);

    String key = element.attr("name");
    String content = element.attr("content");
    String charset = element.attr("charset");

    if (!Strings.isNullOrEmpty(content)) {
      md.setValue(content);
    } else if (!Strings.isNullOrEmpty(charset)) {
      md.setValue(charset);
      // A charset declaration normally has no name attribute; without a fallback the annotation
      // would have an empty key and be indistinguishable from other unnamed meta tags.
      if (Strings.isNullOrEmpty(key)) {
        key = CHARSET_KEY;
      }
    }

    md.setKey(key);
    collector.add(md);
  }
}