/*******************************************************************************
* Copyright 2007, 2009 Jorge Villalon (jorge.villalon@uai.cl)
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*******************************************************************************/
package tml.vectorspace.operations;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
import java.util.Locale;
import java.util.Set;
import java.util.TreeSet;
import tml.annotators.PennTreeAnnotator;
import tml.utils.StanfordUtils;
import tml.vectorspace.operations.results.RelationshipExtractionResult;
import edu.stanford.nlp.trees.Tree;
/**
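* Relationship extraction collects the candidate relationship labels (linking
* words) of a corpus: the distinct verbs found in the Penn parse tree of each
* passage, trimmed, converted to lower case and sorted.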
*
* @author Jorge Villalon
*
*/
public class RelationshipExtraction extends
AbstractOperation<RelationshipExtractionResult> {
@Override
public void start() throws Exception {
super.start();
List<String> rels = new ArrayList<String>();
for (String passageId : this.corpus.getPassages()) {
Tree pennTree = null;
try {
pennTree = StanfordUtils.getTreeFromString(passageId, repository.getDocumentField(passageId, PennTreeAnnotator.FIELD_NAME));
} catch (IOException e) {
e.printStackTrace();
logger.error(e);
return;
}
List<String> verbs = StanfordUtils.extractVerbs(pennTree);
if(verbs != null)
for (String verb : verbs) {
verb = verb.trim().toLowerCase();
if (rels.contains(verb))
continue;
if (verb.length() == 0)
continue;
rels.add(verb);
}
}
Collections.sort(rels);
for (String verb : rels) {
RelationshipExtractionResult result = new RelationshipExtractionResult();
result.setLinkingWord(verb);
this.results.add(result);
}
super.end();
}
}