/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.jackrabbit.core.query.lucene; import java.io.ByteArrayInputStream; import java.io.ByteArrayOutputStream; import java.io.IOException; import java.io.InputStream; import java.io.OutputStreamWriter; import java.util.Calendar; import javax.jcr.Node; import javax.jcr.RepositoryException; import javax.jcr.nodetype.NodeType; import javax.jcr.query.InvalidQueryException; import javax.jcr.query.Query; import org.apache.jackrabbit.core.query.AbstractIndexingTest; import org.apache.jackrabbit.core.query.FulltextQueryTest; public class TextExtractionQueryTest extends AbstractIndexingTest { public void testFileContains() throws Exception { assertFileContains("test.txt", "text/plain", "AE502DBEA2C411DEBD340AD156D89593"); assertFileContains("test.rtf", "application/rtf", "quick brown fox"); } public void testNtFile() throws RepositoryException, IOException { Node file = testRootNode.addNode(nodeName1, "nt:file"); Node resource = file.addNode("jcr:content", "nt:resource"); resource.setProperty("jcr:encoding", "UTF-8"); resource.setProperty("jcr:mimeType", "text/plain"); ByteArrayOutputStream data = new ByteArrayOutputStream(); OutputStreamWriter writer = new OutputStreamWriter(data, "UTF-8"); writer.write("The quick brown fox jumps over the lazy dog."); writer.close(); resource.setProperty("jcr:data", new ByteArrayInputStream(data.toByteArray())); resource.setProperty("jcr:lastModified", Calendar.getInstance()); testRootNode.save(); String xpath = testPath + "/*[jcr:contains(jcr:content, 'lazy')]"; executeXPathQuery(xpath, new Node[]{file}); } private void assertFileContains(String name, String type, String... statements) throws Exception { while (testRootNode.hasNode(nodeName1)) { testRootNode.getNode(nodeName1).remove(); } Node resource = testRootNode.addNode(nodeName1, NodeType.NT_RESOURCE); resource.setProperty("jcr:mimeType", type); InputStream stream = FulltextQueryTest.class.getResourceAsStream(name); try { resource.setProperty("jcr:data", stream); } finally { stream.close(); } testRootNode.save(); flushSearchIndex(); for (String statement : statements) { assertContainsQuery(statement, true); } } private void assertContainsQuery(String statement, boolean match) throws InvalidQueryException, RepositoryException { StringBuffer stmt = new StringBuffer(); stmt.append("/jcr:root").append(testRoot).append("/*"); stmt.append("[jcr:contains(., '").append(statement); stmt.append("')]"); Query q = qm.createQuery(stmt.toString(), Query.XPATH); checkResult(q.execute(), match ? 1 : 0); stmt = new StringBuffer(); stmt.append("SELECT * FROM nt:base "); stmt.append("WHERE jcr:path LIKE '").append(testRoot).append("/%' "); stmt.append("AND CONTAINS(., '").append(statement).append("')"); q = qm.createQuery(stmt.toString(), Query.SQL); checkResult(q.execute(), match ? 1 : 0); } }