/* $RCSfile$ * $Author$ * $Date$ * $Revision$ * * Copyright (C) 2004-2007 The Chemistry Development Kit (CDK) project * * Contact: cdk-devel@lists.sourceforge.net * * This program is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public License * as published by the Free Software Foundation; either version 2.1 * of the License, or (at your option) any later version. * All we ask is that proper credit is given for our work, which includes * - but is not limited to - adding the above copyright notice to the beginning * of your source code files, and to any copyright notice that you may distribute * with programs based on this work. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * */ package org.openscience.cdk.io; import java.io.BufferedReader; import java.io.IOException; import java.io.InputStream; import java.io.InputStreamReader; import java.io.Reader; import java.io.StringReader; import java.util.StringTokenizer; import org.openscience.cdk.annotations.TestClass; import org.openscience.cdk.annotations.TestMethod; import org.openscience.cdk.exception.CDKException; import org.openscience.cdk.interfaces.IAtomContainer; import org.openscience.cdk.interfaces.IChemFile; import org.openscience.cdk.interfaces.IChemModel; import org.openscience.cdk.interfaces.IChemObject; import org.openscience.cdk.interfaces.IChemSequence; import org.openscience.cdk.interfaces.IMoleculeSet; import org.openscience.cdk.io.formats.INChIPlainTextFormat; import org.openscience.cdk.io.formats.IResourceFormat; import org.openscience.cdk.io.inchi.INChIContentProcessorTool; /** * Reads the content of a IUPAC/NIST Chemical Identifier (INChI) plain text * document. This reader parses output generated with INChI 1.12beta like: * <pre> * * Input_File: "E:\Program Files\INChI\inchi-samples\Figure04.mol" * * Structure: 1 * INChI=1.12Beta/C6H6/c1-2-4-6-5-3-1/h1-6H * AuxInfo=1.12Beta/0/N:1,2,3,4,5,6/E:(1,2,3,4,5,6)/rA:6CCCCCC/rB:s1;d1;d2;s3;s4d5;/rC:5.6378,-4.0013,0;5.6378,-5.3313,0;4.4859,-3.3363,0;4.4859,-5.9963,0;3.3341,-4.0013,0;3.3341,-5.3313,0; * </pre> * * @cdk.module extra * @cdk.githash * * @author Egon Willighagen <egonw@sci.kun.nl> * @cdk.created 2004-08-01 * * @cdk.keyword file format, INChI * @cdk.keyword chemical identifier * @cdk.require java1.4+ * * @see org.openscience.cdk.io.INChIReader */ @TestClass("org.openscience.cdk.io.INChIPlainTextReaderTest") public class INChIPlainTextReader extends DefaultChemObjectReader { private BufferedReader input; private INChIContentProcessorTool inchiTool; /** * Construct a INChI reader from a Reader object. * * @param input the Reader with the content */ public INChIPlainTextReader(Reader input) { this.init(); setReader(input); inchiTool = new INChIContentProcessorTool(); } public INChIPlainTextReader(InputStream input) { this(new InputStreamReader(input)); } public INChIPlainTextReader() { this(new StringReader("")); } @TestMethod("testGetFormat") public IResourceFormat getFormat() { return INChIPlainTextFormat.getInstance(); } @TestMethod("testSetReader_Reader") public void setReader(Reader input) { if (input instanceof BufferedReader) { this.input = (BufferedReader)input; } else { this.input = new BufferedReader(input); } } @TestMethod("testSetReader_InputStream") public void setReader(InputStream input) throws CDKException { setReader(new InputStreamReader(input)); } /** * Initializes this reader. */ private void init() {} @TestMethod("testAccepts") public boolean accepts(Class classObject) { Class[] interfaces = classObject.getInterfaces(); for (int i=0; i<interfaces.length; i++) { if (IChemFile.class.equals(interfaces[i])) return true; } Class superClass = classObject.getSuperclass(); if (superClass != null) return this.accepts(superClass); return false; } /** * Reads a IChemObject of type object from input. * Supported types are: ChemFile. * * @param object type of requested IChemObject * @return the content in a ChemFile object */ public IChemObject read(IChemObject object) throws CDKException { if (object instanceof IChemFile) { return (IChemObject)readChemFile((IChemFile)object); } else { throw new CDKException("Only supported is reading of ChemFile objects."); } } // private functions /** * Reads a ChemFile object from input. * * @return ChemFile with the content read from the input */ private IChemFile readChemFile(IChemFile cf) throws CDKException { // have to do stuff here try { String line = null; while ((line = input.readLine())!=null) { if (line.startsWith("INChI=") || line.startsWith("InChI=")) { // ok, the fun starts cf = cf.getBuilder().newChemFile(); // ok, we need to parse things like: // INChI=1.12Beta/C6H6/c1-2-4-6-5-3-1/h1-6H final String INChI = line.substring(6); StringTokenizer tokenizer = new StringTokenizer(INChI, "/"); // ok, we expect 4 tokens tokenizer.nextToken(); // 1.12Beta not stored since never used final String formula = tokenizer.nextToken(); // C6H6 final String connections = tokenizer.nextToken().substring(1); // 1-2-4-6-5-3-1 //final String hydrogens = tokenizer.nextToken().substring(1); // 1-6H IAtomContainer parsedContent = inchiTool.processFormula( cf.getBuilder().newAtomContainer(), formula ); inchiTool.processConnections(connections, parsedContent, -1); IMoleculeSet moleculeSet = cf.getBuilder().newMoleculeSet(); moleculeSet.addMolecule(cf.getBuilder().newMolecule(parsedContent)); IChemModel model = cf.getBuilder().newChemModel(); model.setMoleculeSet(moleculeSet); IChemSequence sequence = cf.getBuilder().newChemSequence(); sequence.addChemModel(model); cf.addChemSequence(sequence); } } } catch (Exception exception) { exception.printStackTrace(); throw new CDKException("Error while reading INChI file: " + exception.getMessage(), exception); } return cf; } @TestMethod("testClose") public void close() throws IOException { input.close(); } }