/* * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.jena.atlas.data; import java.io.File ; import java.util.ArrayList ; import java.util.Collections ; import java.util.Iterator ; import java.util.List ; import java.util.Random ; import junit.framework.TestCase ; import org.apache.jena.atlas.data.SortedDataBag ; import org.apache.jena.atlas.data.ThresholdPolicyCount ; import org.apache.jena.atlas.iterator.Iter ; import org.apache.jena.datatypes.xsd.XSDDatatype ; import org.apache.jena.graph.NodeFactory ; import org.junit.Test ; import org.apache.jena.query.Query ; import org.apache.jena.query.QueryCancelledException ; import org.apache.jena.query.SortCondition ; import org.apache.jena.riot.system.SerializationFactoryFinder ; import org.apache.jena.sparql.core.Var ; import org.apache.jena.sparql.engine.QueryIterator ; import org.apache.jena.sparql.engine.binding.Binding ; import org.apache.jena.sparql.engine.binding.BindingComparator ; import org.apache.jena.sparql.engine.binding.BindingFactory ; import org.apache.jena.sparql.engine.binding.BindingMap ; import org.apache.jena.sparql.expr.ExprVar ; public class TestSortedDataBag extends TestCase { private static final String LETTERS = "qwertyuiopasdfghjklzxcvbnmQWERTYUIOPASDFGHJKLZXCVBNM"; private Random random; @Test public void testSorting() { testSorting(500, 10); } private void testSorting(int numBindings, int threshold) { List<Binding> unsorted = randomBindings(numBindings); List<SortCondition> conditions = new ArrayList<>(); conditions.add(new SortCondition(new ExprVar("8"), Query.ORDER_ASCENDING)); conditions.add(new SortCondition(new ExprVar("1"), Query.ORDER_ASCENDING)); conditions.add(new SortCondition(new ExprVar("0"), Query.ORDER_DESCENDING)); BindingComparator comparator = new BindingComparator(conditions); List<Binding> sorted = new ArrayList<>(); SortedDataBag<Binding> db = new SortedDataBag<>( new ThresholdPolicyCount<Binding>(threshold), SerializationFactoryFinder.bindingSerializationFactory(), comparator); try { db.addAll(unsorted); Iterator<Binding> iter = db.iterator(); while (iter.hasNext()) { sorted.add(iter.next()); } Iter.close(iter); } finally { db.close(); } Collections.sort(unsorted, comparator); assertEquals(unsorted, sorted); } @Test public void testSortingWithPreMerge() { // Save the original value... int origMaxSpillFiles = SortedDataBag.MAX_SPILL_FILES; try { // Vary the number of spill files and bindings so we get a variable number of premerge rounds SortedDataBag.MAX_SPILL_FILES = 2; testSorting(1, 1); SortedDataBag.MAX_SPILL_FILES = 2; testSorting(2, 1); SortedDataBag.MAX_SPILL_FILES = 2; testSorting(3, 1); SortedDataBag.MAX_SPILL_FILES = 2; testSorting(4, 1); SortedDataBag.MAX_SPILL_FILES = 2; testSorting(5, 1); SortedDataBag.MAX_SPILL_FILES = 2; testSorting(1, 10); SortedDataBag.MAX_SPILL_FILES = 2; testSorting(1000, 10); SortedDataBag.MAX_SPILL_FILES = 100; testSorting(1000, 10); SortedDataBag.MAX_SPILL_FILES = 2; testSorting(10, 10); SortedDataBag.MAX_SPILL_FILES = 5; testSorting(10, 10); } finally { SortedDataBag.MAX_SPILL_FILES = origMaxSpillFiles; } } @Test public void testTemporaryFilesAreCleanedUpAfterCompletion() { List<Binding> unsorted = randomBindings(500); List<SortCondition> conditions = new ArrayList<>(); conditions.add(new SortCondition(new ExprVar("8"), Query.ORDER_ASCENDING)); BindingComparator comparator = new BindingComparator(conditions); SortedDataBag<Binding> db = new SortedDataBag<>( new ThresholdPolicyCount<Binding>(10), SerializationFactoryFinder.bindingSerializationFactory(), comparator); List<File> spillFiles = new ArrayList<>(); try { db.addAll(unsorted); spillFiles.addAll(db.getSpillFiles()); int count = 0; for (File file : spillFiles) { if (file.exists()) { count++; } } // 500 bindings divided into 50 chunks (49 in files, and 1 in memory) assertEquals(49, count); Iterator<Binding> iter = db.iterator(); while (iter.hasNext()) { iter.next(); } Iter.close(iter); } finally { db.close(); } int count = 0; for (File file : spillFiles) { if (file.exists()) { count++; } } assertEquals(0, count); } private List<Binding> randomBindings(int numBindings) { random = new Random(); Var[] vars = new Var[]{ Var.alloc("1"), Var.alloc("2"), Var.alloc("3"), Var.alloc("4"), Var.alloc("5"), Var.alloc("6"), Var.alloc("7"), Var.alloc("8"), Var.alloc("9"), Var.alloc("0") }; List<Binding> toReturn = new ArrayList<>(); for(int i = 0; i < numBindings; i++){ toReturn.add(randomBinding(vars)); } return toReturn; } private Binding randomBinding(Var[] vars) { BindingMap binding = BindingFactory.create(); binding.add(vars[0], NodeFactory.createBlankNode()); binding.add(vars[1], NodeFactory.createURI(randomURI())); binding.add(vars[2], NodeFactory.createURI(randomURI())); binding.add(vars[3], NodeFactory.createLiteral(randomString(20))); binding.add(vars[4], NodeFactory.createBlankNode()); binding.add(vars[5], NodeFactory.createURI(randomURI())); binding.add(vars[6], NodeFactory.createURI(randomURI())); binding.add(vars[7], NodeFactory.createLiteral(randomString(5))); binding.add(vars[8], NodeFactory.createLiteral("" + random.nextInt(), XSDDatatype.XSDinteger)); binding.add(vars[9], NodeFactory.createBlankNode()); return binding; } private String randomURI() { return String.format("http://%s.example.com/%s", randomString(10), randomString(10)); } private String randomString(int length) { StringBuilder builder = new StringBuilder(); for(int i = 0; i < length; i++){ builder.append(LETTERS.charAt(random.nextInt(LETTERS.length()))); } return builder.toString(); } private void getNextAndExpectException(QueryIterator iter) { try{ iter.hasNext(); fail("Expected an exception here"); }catch(QueryCancelledException e){ // expected }catch(Exception e){ fail("Unexpected exception"); } } }