/* * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.jena.fuseki.servlets; import static java.lang.String.format ; import java.io.IOException ; import java.io.InputStream ; import java.io.PrintWriter ; import java.util.zip.GZIPInputStream ; import javax.servlet.ServletException ; import javax.servlet.http.HttpServletRequest ; import javax.servlet.http.HttpServletResponse ; import org.apache.commons.fileupload.FileItemIterator ; import org.apache.commons.fileupload.FileItemStream ; import org.apache.commons.fileupload.servlet.ServletFileUpload ; import org.apache.commons.fileupload.util.Streams ; import org.apache.jena.atlas.lib.Pair ; import org.apache.jena.atlas.web.ContentType ; import org.apache.jena.fuseki.FusekiLib ; import org.apache.jena.fuseki.HttpNames ; import org.apache.jena.graph.Graph ; import org.apache.jena.graph.Node ; import org.apache.jena.graph.NodeFactory ; import org.apache.jena.iri.IRI ; import org.apache.jena.riot.Lang ; import org.apache.jena.riot.RDFLanguages ; import org.apache.jena.riot.lang.StreamRDFCounting ; import org.apache.jena.riot.system.* ; import org.apache.jena.sparql.core.Quad ; import org.apache.jena.sparql.graph.GraphFactory ; import org.apache.jena.web.HttpSC ; public class SPARQL_Upload extends SPARQL_ServletBase { private static ErrorHandler errorHandler = ErrorHandlerFactory.errorHandlerStd(log) ; public SPARQL_Upload() { super() ; } // Methods to respond to. @Override protected void doPost(HttpServletRequest request, HttpServletResponse response) throws ServletException, IOException { doCommon(request, response) ; } @Override protected void doOptions(HttpServletRequest request, HttpServletResponse response) { setCommonHeadersForOptions(response) ; response.setHeader(HttpNames.hAllow, "OPTIONS,POST"); response.setHeader(HttpNames.hContentLengh, "0") ; } @Override protected void perform(HttpAction action) { // Only allows one file in the upload. boolean isMultipart = ServletFileUpload.isMultipartContent(action.request); if ( ! isMultipart ) error(HttpSC.BAD_REQUEST_400 , "Not a file upload") ; long count = upload(action, "http://example/upload-base/") ; try { action.response.setContentType("text/html") ; action.response.setStatus(HttpSC.OK_200); PrintWriter out = action.response.getWriter() ; out.println("<html>") ; out.println("<head>") ; out.println("</head>") ; out.println("<body>") ; out.println("<h1>Success</h1>"); out.println("<p>") ; out.println("Triples = "+count + "\n"); out.println("<p>") ; out.println("</p>") ; out.println("<button onclick=\"timeFunction()\">Back to Fuseki</button>"); out.println("</p>") ; out.println("<script type=\"text/javascript\">"); out.println("function timeFunction(){"); out.println("window.location.href = \"/fuseki.html\";}"); out.println("</script>"); out.println("</body>") ; out.println("</html>") ; out.flush() ; success(action) ; } catch (Exception ex) { errorOccurred(ex) ; } } // Also used by SPARQL_REST static public long upload(HttpAction action, String base) { if ( action.isTransactional() ) return uploadTxn(action, base) ; else return uploadNonTxn(action, base) ; } /** Non-transaction - buffer to a temporary graph so that parse errors * are caught before inserting any data. */ private static long uploadNonTxn(HttpAction action, String base) { Pair<String, Graph> p = uploadWorker(action, base) ; String graphName = p.getLeft() ; Graph graphTmp = p.getRight() ; long tripleCount = graphTmp.size() ; log.info(format("[%d] Upload: Graph: %s (%d triple(s))", action.id, graphName, tripleCount)) ; Node gn = graphName.equals(HttpNames.valueDefault) ? Quad.defaultGraphNodeGenerated : NodeFactory.createURI(graphName) ; action.beginWrite() ; try { FusekiLib.addDataInto(graphTmp, action.getActiveDSG(), gn) ; action.commit() ; return tripleCount ; } catch (RuntimeException ex) { // If anything went wrong, try to backout. try { action.abort() ; } catch (Exception ex2) {} errorOccurred(ex.getMessage()) ; return -1 ; } finally { action.endWrite() ; } } /** Transactional - we'd like data to go straight to the destination, with an abort on parse error. * But file upload with a name means that the name can be after the data * (it is in the Fuseki default pages). * Use Graph Store protocol for bulk uploads. * (It would be possible to process the incoming stream and see the graph name first.) */ private static long uploadTxn(HttpAction action, String base) { // We can't do better than the non-transaction approach. return uploadNonTxn(action, base) ; } /** process an HTTP upload of RDF. * We can't stream straight into a dataset because the graph name can be after the data. * @return graph name and count */ static private Pair<String, Graph> uploadWorker(HttpAction action, String base) { Graph graphTmp = GraphFactory.createDefaultGraph() ; ServletFileUpload upload = new ServletFileUpload(); String graphName = null ; long count = -1 ; String name = null ; ContentType ct = null ; Lang lang = null ; try { FileItemIterator iter = upload.getItemIterator(action.request); while (iter.hasNext()) { FileItemStream item = iter.next(); String fieldName = item.getFieldName(); InputStream stream = item.openStream(); if (item.isFormField()) { // Graph name. String value = Streams.asString(stream, "UTF-8") ; if ( fieldName.equals(HttpNames.paramGraph) ) { graphName = value ; if ( graphName != null && ! graphName.equals("") && ! graphName.equals(HttpNames.valueDefault) ) { IRI iri = IRIResolver.parseIRI(value) ; if ( iri.hasViolation(false) ) errorBadRequest("Bad IRI: "+graphName) ; if ( iri.getScheme() == null ) errorBadRequest("Bad IRI: no IRI scheme name: "+graphName) ; if ( iri.getScheme().equalsIgnoreCase("http") || iri.getScheme().equalsIgnoreCase("https")) { // Redundant?? if ( iri.getRawHost() == null ) errorBadRequest("Bad IRI: no host name: "+graphName) ; if ( iri.getRawPath() == null || iri.getRawPath().length() == 0 ) errorBadRequest("Bad IRI: no path: "+graphName) ; if ( iri.getRawPath().charAt(0) != '/' ) errorBadRequest("Bad IRI: Path does not start '/': "+graphName) ; } } } else if ( fieldName.equals(HttpNames.paramDefaultGraphURI) ) graphName = null ; else // Add file type? log.info(format("[%d] Upload: Field=%s ignored", action.id, fieldName)) ; } else { // Process the input stream name = item.getName() ; if ( name == null || name.equals("") || name.equals("UNSET FILE NAME") ) errorBadRequest("No name for content - can't determine RDF syntax") ; String contentTypeHeader = item.getContentType() ; ct = ContentType.create(contentTypeHeader) ; lang = RDFLanguages.contentTypeToLang(ct.getContentType()) ; if ( lang == null ) { lang = RDFLanguages.filenameToLang(name) ; //JENA-600 filenameToLang() strips off certain extensions such as .gz and //we need to ensure that if there was a .gz extension present we wrap the stream accordingly if (name.endsWith(".gz")) stream = new GZIPInputStream(stream); } if ( lang == null ) // Desperate. lang = RDFLanguages.RDFXML ; log.info(format("[%d] Upload: Filename: %s, Content-Type=%s, Charset=%s => %s", action.id, name, ct.getContentType(), ct.getCharset(), lang.getName())) ; StreamRDF x = StreamRDFLib.graph(graphTmp) ; StreamRDFCounting dest = StreamRDFLib.count(x) ; SPARQL_REST.parse(action, dest, stream, lang, base); count = dest.count() ; } } if ( graphName == null || graphName.equals("") ) graphName = HttpNames.valueDefault ; return Pair.create(graphName, graphTmp) ; } catch (ActionErrorException ex) { throw ex ; } catch (Exception ex) { errorOccurred(ex) ; return null ; } } @Override protected void validate(HttpAction action) {} }