/* * Copyright (C) 2008-2015 by Holger Arndt * * This file is part of the Universal Java Matrix Package (UJMP). * See the NOTICE file distributed with this work for additional * information regarding copyright ownership and licensing. * * UJMP is free software; you can redistribute it and/or modify * it under the terms of the GNU Lesser General Public License as * published by the Free Software Foundation; either version 2 * of the License, or (at your option) any later version. * * UJMP is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with UJMP; if not, write to the * Free Software Foundation, Inc., 51 Franklin St, Fifth Floor, * Boston, MA 02110-1301 USA */ package org.ujmp.core.text; import java.util.Arrays; import java.util.Collection; import org.ujmp.core.listmatrix.DefaultListMatrix; public class DefaultTextSentence extends DefaultListMatrix<TextToken> implements TextSentence { private static final long serialVersionUID = -1411406267646623488L; private static int sentenceId = 1; public DefaultTextSentence(String sentence) { this(TextUtil.convertSentenceToTextTokens(sentence)); } public DefaultTextSentence(TextToken... textTokens) { this(Arrays.asList(textTokens)); } public DefaultTextSentence(Collection<TextToken> textTokens) { setMetaData(ID, "Sentence" + (sentenceId++)); addAll(textTokens); } public String toString() { StringBuilder sb = new StringBuilder(); for (TextToken token : this) { int i = 0; sb.append(token.getText()); String tag = token.getTag(); if (!"n/a".equals(tag)) { sb.append(" [" + tag + "]"); } if (i++ < size() - 1) { sb.append(" "); } } return sb.toString(); } public String toJson() { StringBuilder sb = new StringBuilder(); sb.append(" {\n"); sb.append(" \"Type\": \"Sentence\",\n"); sb.append(" \"Id\": "); sb.append("\""); sb.append(getMetaData("Id")); sb.append("\",\n"); sb.append(" \"Tokens\":\n"); sb.append(" [\n"); int i = 0; for (TextToken token : this) { sb.append(token.toJson()); if (i++ < size() - 1) { sb.append(",\n"); } } sb.append("\n ]\n"); sb.append(" }"); return sb.toString(); } public boolean setTag(String token, String tag) { boolean tokenFound = false; for (TextToken text : this) { if (token.equals(text.getText())) { if (tokenFound) { throw new RuntimeException("multiple matching tokens found"); } text.setTag(tag); tokenFound = true; } } return tokenFound; } }