/*
 * This file is part of ELKI:
 * Environment for Developing KDD-Applications Supported by Index-Structures
 *
 * Copyright (C) 2017
 * ELKI Development Team
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
package de.lmu.ifi.dbs.elki.datasource.parser;

import java.io.IOException;
import java.io.InputStream;

import de.lmu.ifi.dbs.elki.database.ids.DBIDVar;
import de.lmu.ifi.dbs.elki.datasource.bundle.MultipleObjectsBundle;
import de.lmu.ifi.dbs.elki.logging.Logging;
import de.lmu.ifi.dbs.elki.utilities.ClassGenericsUtil;
import de.lmu.ifi.dbs.elki.utilities.io.TokenizedReader;
import de.lmu.ifi.dbs.elki.utilities.io.Tokenizer;
import de.lmu.ifi.dbs.elki.utilities.optionhandling.AbstractParameterizer;
import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameterization.Parameterization;

/**
 * Shared skeleton for parsers that implement {@link StreamingParser}.
 *
 * The class owns a {@link TokenizedReader} built from a {@link CSVReaderFormat}
 * together with that reader's {@link Tokenizer}, and supplies the stream
 * set-up, bundle conversion and clean-up plumbing. This base implementation
 * does not provide DBIDs.
 *
 * @author Erich Schubert
 * @since 0.4.0
 *
 * @apiviz.uses CSVReaderFormat
 * @apiviz.composedOf TokenizedReader
 * @apiviz.composedOf Tokenizer
 */
public abstract class AbstractStreamingParser implements StreamingParser {
  /**
   * Reader obtained from the format; reset for every new input stream.
   */
  protected TokenizedReader reader;

  /**
   * Tokenizer belonging to {@link #reader}.
   */
  protected Tokenizer tokenizer;

  /**
   * Constructor.
   *
   * @param format Reader format used to create the tokenized reader
   */
  public AbstractStreamingParser(CSVReaderFormat format) {
    final TokenizedReader tokenized = format.makeReader();
    this.reader = tokenized;
    this.tokenizer = tokenized.getTokenizer();
  }

  /**
   * Initialize this parser on the given stream, then build a bundle from this
   * parser via {@link MultipleObjectsBundle#fromStream}.
   *
   * @param in Input stream to parse
   * @return Bundle created from this stream parser
   */
  @Override
  public final MultipleObjectsBundle parse(InputStream in) {
    initStream(in);
    final MultipleObjectsBundle bundle = MultipleObjectsBundle.fromStream(this);
    return bundle;
  }

  /**
   * Reset the reader onto a new input stream.
   *
   * @param in Input stream to read from
   */
  @Override
  public void initStream(InputStream in) {
    this.reader.reset(in);
  }

  /**
   * This base implementation never provides DBIDs.
   *
   * @return always {@code false}
   */
  @Override
  public boolean hasDBIDs() {
    return false;
  }

  /**
   * No DBID is available here: the variable is unset.
   *
   * @param var Variable to unset
   * @return always {@code false}
   */
  @Override
  public boolean assignDBID(DBIDVar var) {
    var.unset();
    return false;
  }

  /**
   * Build a bundle from this parser via
   * {@link MultipleObjectsBundle#fromStream}.
   *
   * @return Bundle created from this stream parser
   */
  @Override
  public MultipleObjectsBundle asMultipleObjectsBundle() {
    final MultipleObjectsBundle bundle = MultipleObjectsBundle.fromStream(this);
    return bundle;
  }

  /**
   * Close the reader. An {@link IOException} raised while closing is passed
   * to the logger instead of being thrown.
   */
  @Override
  public void cleanup() {
    try {
      this.reader.close();
    }
    catch(IOException closeFailure) {
      final Logging log = getLogger();
      log.exception(closeFailure);
    }
  }

  /**
   * Access the logger of the concrete parser class.
   *
   * @return Logger.
   */
  protected abstract Logging getLogger();

  /**
   * Parameterization class.
   *
   * @author Erich Schubert
   *
   * @apiviz.exclude
   */
  public abstract static class Parameterizer extends AbstractParameterizer {
    /**
     * Reader format, filled in by {@link #makeOptions}.
     */
    protected CSVReaderFormat format;

    @Override
    protected void makeOptions(Parameterization config) {
      super.makeOptions(config);
      final CSVReaderFormat configured = ClassGenericsUtil.parameterizeOrAbort(CSVReaderFormat.class, config);
      this.format = configured;
    }

    @Override
    protected abstract AbstractStreamingParser makeInstance();
  }
}