/*************************************************************************
* *
* This file is part of the 20n/act project. *
* 20n/act enables DNA prediction for synthetic biology/bioengineering. *
* Copyright (C) 2017 20n Labs, Inc. *
* *
* Please direct all queries to act@20n.com. *
* *
* This program is free software: you can redistribute it and/or modify *
* it under the terms of the GNU General Public License as published by *
* the Free Software Foundation, either version 3 of the License, or *
* (at your option) any later version. *
* *
* This program is distributed in the hope that it will be useful, *
* but WITHOUT ANY WARRANTY; without even the implied warranty of *
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
* GNU General Public License for more details. *
* *
* You should have received a copy of the GNU General Public License *
* along with this program. If not, see <http://www.gnu.org/licenses/>. *
* *
*************************************************************************/
package com.act.biointerpretation.sars;
import com.fasterxml.jackson.annotation.JsonProperty;
import com.fasterxml.jackson.databind.ObjectMapper;
import com.fasterxml.jackson.databind.SerializationFeature;
import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.File;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collection;
import java.util.Iterator;
import java.util.List;
/**
* Represents a corpus of reaction groups. This should serve as the intermediate format between pipelines that group
* reactions together, i.e. by sequence clustering, RO groups, LibMCS clustering, or any other method,
* and pipelines that characterize those grouped reactions with SARs and generalized ROs.
*/
public class ReactionGroupCorpus implements Iterable<ReactionGroup> {
private static final ObjectMapper OBJECT_MAPPER = new ObjectMapper();
static {
OBJECT_MAPPER.enable(SerializationFeature.INDENT_OUTPUT);
}
@JsonProperty
private List<ReactionGroup> reactionGroups;
public ReactionGroupCorpus() {
reactionGroups = new ArrayList<>();
}
public ReactionGroupCorpus(Collection<ReactionGroup> groups) {
reactionGroups = new ArrayList<>(groups);
}
@Override
public Iterator<ReactionGroup> iterator() {
return reactionGroups.iterator();
}
public void printToJsonFile(File outputFile) throws IOException {
try (BufferedWriter writer = new BufferedWriter(new FileWriter(outputFile))) {
OBJECT_MAPPER.writeValue(writer, this);
}
}
public void addGroup(ReactionGroup group) {
reactionGroups.add(group);
}
/**
* Read a ReactionGroupCorpus corpus from file.
*
* @param corpusFile The file to read.
* @return The ReactionGroupCorpus.
* @throws IOException
*/
public static ReactionGroupCorpus loadFromJsonFile(File corpusFile) throws IOException {
return OBJECT_MAPPER.readValue(corpusFile, ReactionGroupCorpus.class);
}
/**
* Read a ReactionGroupCorpus from a text file.
* File should contain DB name on the first line.
* Thereafter each line should have one group of reactions, written as a tab separated list of reaction IDs
*/
public static ReactionGroupCorpus loadFromTextFile(File corpusFile) throws IOException {
ReactionGroupCorpus corpus = new ReactionGroupCorpus();
try (BufferedReader reader = new BufferedReader(new FileReader(corpusFile))) {
String dbName = reader.readLine();
String line;
while ((line = reader.readLine()) != null) {
List<String> fields = Arrays.asList(line.split(","));
ReactionGroup group = new ReactionGroup(fields.get(0), dbName);
for (String idString : fields.subList(1, fields.size())) {
group.addReactionId(Long.parseLong(idString));
}
corpus.addGroup(group);
}
}
return corpus;
}
}