/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.jena.riot.lang;
import java.io.IOException ;
import java.io.InputStream ;
import java.io.Reader ;
import org.apache.jena.atlas.io.IO ;
import org.apache.jena.atlas.lib.Pair ;
import org.apache.jena.datatypes.RDFDatatype ;
import org.apache.jena.datatypes.TypeMapper ;
import org.apache.jena.graph.Node ;
import org.apache.jena.graph.NodeFactory ;
import org.apache.jena.graph.Triple ;
import org.apache.jena.rdf.model.RDFErrorHandler ;
import org.apache.jena.rdfxml.xmlinput.* ;
import org.apache.jena.rdfxml.xmlinput.impl.ARPSaxErrorHandler ;
import org.apache.jena.riot.Lang ;
import org.apache.jena.riot.RDFLanguages ;
import org.apache.jena.riot.checker.CheckerLiterals ;
import org.apache.jena.riot.system.ErrorHandler ;
import org.apache.jena.riot.system.ParserProfile ;
import org.apache.jena.riot.system.RiotLib ;
import org.apache.jena.riot.system.StreamRDF ;
import org.xml.sax.SAXException ;
import org.xml.sax.SAXParseException ;
/** RDF/XML.
*
* @see <a href="http://www.w3.org/TR/rdf-syntax-grammar/">http://www.w3.org/TR/rdf-syntax-grammar/</a>
*/
public class LangRDFXML implements LangRIOT
{
// This is not a full member of the RIOT suite because it needs to work
// with Xerces and already carries out it's own error handling and output
private ARP arp = new ARP() ;
private InputStream input = null ;
private Reader reader = null ;
private String xmlBase ;
private String filename ;
private StreamRDF sink ;
private ParserProfile profile ; // Warning - we don't use all of this.
@Override
public ParserProfile getProfile()
{
return profile ;
}
@Override
public void setProfile(ParserProfile profile)
{ this.profile = profile ; }
public static LangRDFXML create(InputStream in, String xmlBase, String filename, ErrorHandler errorHandler, StreamRDF sink) {
return new LangRDFXML(in, xmlBase, filename, errorHandler, sink) ;
}
public static LangRDFXML create(Reader reader, String xmlBase, String filename, ErrorHandler errorHandler, StreamRDF sink) {
return new LangRDFXML(reader, xmlBase, filename, errorHandler, sink) ;
}
public static LangRDFXML create(String xmlBase, String filename, ErrorHandler errorHandler, StreamRDF sink) {
return create(IO.openFile(filename), xmlBase, filename, errorHandler, sink) ;
}
private LangRDFXML(Reader reader, String xmlBase, String filename, ErrorHandler errorHandler, StreamRDF sink) {
this.reader = reader ;
this.xmlBase = xmlBase ;
this.filename = filename ;
this.sink = sink ;
this.profile = RiotLib.profile(getLang(), xmlBase, errorHandler) ;
}
private LangRDFXML(InputStream in, String xmlBase, String filename, ErrorHandler errorHandler, StreamRDF sink) {
this.input = in ;
this.xmlBase = xmlBase ;
this.filename = filename ;
this.sink = sink ;
this.profile = RiotLib.profile(getLang(), xmlBase, errorHandler) ;
}
@Override
public Lang getLang() { return RDFLanguages.RDFXML ; }
public static boolean RiotUniformCompatibility = false ;
// Warnings in ARP that should be errors to be compatible with
// non-XML-based languages. e.g. language tags should be
// syntactically valid.
private static int[] additionalErrors = new int[] {
ARPErrorNumbers.WARN_MALFORMED_XMLLANG
//, ARPErrorNumbers.WARN_STRING_NOT_NORMAL_FORM_C
} ;
@Override
public void parse() {
// Hacked out of ARP because of all the "private" methods
sink.start() ;
HandlerSink rslt = new HandlerSink(sink, getProfile().getHandler()) ;
arp.getHandlers().setStatementHandler(rslt) ;
arp.getHandlers().setErrorHandler(rslt) ;
arp.getHandlers().setNamespaceHandler(rslt) ;
if ( RiotUniformCompatibility ) {
ARPOptions options = arp.getOptions() ;
// Convert some warnings to errors for compatible behaviour for all parsers.
for ( int code : additionalErrors )
options.setErrorMode(code, ARPErrorNumbers.EM_FATAL) ;
arp.setOptionsWith(options) ;
}
try {
if ( reader != null )
arp.load(reader, xmlBase) ;
else
arp.load(input, xmlBase) ;
}
catch (IOException e) {
getProfile().getHandler().error(filename + ": " + ParseException.formatMessage(e), -1, -1) ;
}
catch (SAXParseException e) {
// already reported.
}
catch (SAXException sax) {
getProfile().getHandler().error(filename + ": " + ParseException.formatMessage(sax), -1, -1) ;
}
sink.finish() ;
}
private static class HandlerSink extends ARPSaxErrorHandler implements StatementHandler, NamespaceHandler {
private StreamRDF output ;
private ErrorHandler errHandler ;
private CheckerLiterals checker ;
HandlerSink(StreamRDF output, ErrorHandler errHandler) {
super(new ErrorHandlerBridge(errHandler)) ;
this.output = output ;
this.errHandler = errHandler ;
this.checker = new CheckerLiterals(errHandler) ;
}
@Override
public void statement(AResource subj, AResource pred, AResource obj)
{ output.triple(convert(subj, pred, obj)); }
@Override
public void statement(AResource subj, AResource pred, ALiteral lit)
{ output.triple(convert(subj, pred, lit)) ; }
// From JenaReader
private static Node convert(ALiteral lit) {
String dtURI = lit.getDatatypeURI();
if (dtURI == null)
return NodeFactory.createLiteral(lit.toString(), lit.getLang());
if (lit.isWellFormedXML()) {
return NodeFactory.createLiteral(lit.toString(), null, true);
}
RDFDatatype dt = TypeMapper.getInstance().getSafeTypeByName(dtURI);
return NodeFactory.createLiteral(lit.toString(), dt);
}
private static Node convert(AResource r) {
if (!r.isAnonymous())
return NodeFactory.createURI(r.getURI());
// String id = r.getAnonymousID();
Node rr = (Node) r.getUserData();
if (rr == null) {
rr = NodeFactory.createBlankNode();
r.setUserData(rr);
}
return rr;
}
private Triple convert(AResource s, AResource p, AResource o) {
return Triple.create(convert(s), convert(p), convert(o)) ;
}
private Triple convert(AResource s, AResource p, ALiteral o) {
Node object = convert(o) ;
checker.check(object, -1, -1) ;
return Triple.create(convert(s), convert(p), object) ;
}
@Override
public void startPrefixMapping(String prefix, String uri) {
output.prefix(prefix, uri) ;
}
@Override
public void endPrefixMapping(String prefix) {}
}
private static class ErrorHandlerBridge implements RDFErrorHandler {
private ErrorHandler errorHandler ;
ErrorHandlerBridge(ErrorHandler hander) {
this.errorHandler = hander ;
}
@Override
public void warning(Exception e) {
Pair<Integer, Integer> p = getLineCol(e) ;
errorHandler.warning(e.getMessage(), p.getLeft(), p.getRight()) ;
}
@Override
public void error(Exception e) {
Pair<Integer, Integer> p = getLineCol(e) ;
errorHandler.error(e.getMessage(), p.getLeft(), p.getRight()) ;
}
@Override
public void fatalError(Exception e) {
Pair<Integer, Integer> p = getLineCol(e) ;
errorHandler.fatal(e.getMessage(), p.getLeft(), p.getRight()) ;
}
private static Pair<Integer, Integer> getLineCol(Exception e) {
if ( e instanceof SAXParseException ) {
SAXParseException esax = (SAXParseException)e ;
return Pair.create(esax.getLineNumber(), esax.getColumnNumber()) ;
} else {
return Pair.create(-1, -1) ;
}
}
}
}