/*******************************************************************************
 * Copyright (c) 2012 György Orosz, Attila Novák.
 * All rights reserved. This program and the accompanying materials
 * are made available under the terms of the GNU Lesser Public License v3
 * which accompanies this distribution, and is available at
 * http://www.gnu.org/licenses/
 *
 * This file is part of PurePos.
 *
 * PurePos is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Lesser Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * PurePos is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Lesser Public License for more details.
 *
 * Contributors:
 * György Orosz - initial API and implementation
 ******************************************************************************/
package hu.ppke.itk.nlpg.purepos.model.internal;

import hu.ppke.itk.nlpg.purepos.model.INGram;

import java.io.Serializable;
import java.util.LinkedList;
import java.util.List;
import java.util.ListIterator;

/**
 * Standard implementation of the INGram interface, which keeps its tokens in a
 * private copy held in a {@link LinkedList}.
 * <p>
 * Comparison, equality and hashing only look at a window of tokens counted
 * from the end of the n-gram. The window holds at most {@code compareLength}
 * tokens; a {@code compareLength} of {@code -1} means the window is unbounded.
 * The hash code is computed once, in the constructor, and cached.
 *
 * @author György Orosz
 *
 * @param <T>
 *            type of the tokens stored in the n-gram
 */
public class NGram<T extends Comparable<T>> implements INGram<T>, Serializable {

    private static final long serialVersionUID = 1L;

    /** Multiplier used when combining token hashes. */
    protected final int HASH_NUM = 31;

    /** Hash value cached at construction time. */
    protected final int hashCode;

    /** The tokens of this n-gram, in order. */
    protected final List<T> tokenList;

    /** Size of the comparison window, or -1 for "no limit". */
    protected final int compareLength;

    /**
     * Creates an n-gram from a copy of the given tokens.
     *
     * @param tokens
     *            The n-gram elements
     * @param compareLength
     *            the size of the compare window (used to compare two elements
     *            starting from the end); -1 means no limit
     */
    public NGram(List<T> tokens, int compareLength) {
        this.tokenList = new LinkedList<T>(tokens);
        this.compareLength = compareLength;
        this.hashCode = initHashCode();
    }

    /**
     * Creates an n-gram from a copy of the given tokens with one extra token
     * appended at the end.
     *
     * @param tokens
     *            the leading n-gram elements
     * @param newElement
     *            the element appended after {@code tokens}
     * @param compareLength
     *            the size of the compare window (used to compare two elements
     *            starting from the end); -1 means no limit
     */
    public NGram(List<T> tokens, T newElement, int compareLength) {
        this.compareLength = compareLength;
        List<T> extended = new LinkedList<T>(tokens);
        extended.add(newElement);
        this.tokenList = extended;
        this.hashCode = initHashCode();
    }

    /**
     * Creates an n-gram whose compare window is unbounded (compareLength -1).
     *
     * @param tokens
     *            The n-gram elements
     */
    public NGram(List<T> tokens) {
        this(tokens, -1);
    }

    /**
     * Returns a new n-gram holding this n-gram's tokens followed by {@code e},
     * with the same compare window; this instance is left untouched.
     */
    @Override
    public NGram<T> add(T e) {
        return new NGram<T>(tokenList, e, compareLength);
    }

    @Override
    public String toString() {
        return tokenList.toString();
    }

    /** Returns the hash value cached by the constructor. */
    @Override
    public int hashCode() {
        return hashCode;
    }

    /**
     * Computes the hash over the compare window, walking the tokens from the
     * last one backwards, i.e. over the same tokens that
     * {@link #compareTo(NGram)} inspects.
     * <p>
     * The token hashes are combined order-sensitively
     * ({@code h = h * HASH_NUM + tokenHash}). The earlier formula summed
     * {@code tokenHash * HASH_NUM}, which gave every permutation of the same
     * tokens an identical hash.
     * <p>
     * NOTE(review): the cached value is a serialized field, so instances
     * serialized with the earlier formula keep their old hash - confirm that
     * no persisted data relies on it.
     *
     * @return the hash value of the tokens inside the compare window
     */
    public int initHashCode() {
        int hash = 0;
        final int limit = windowSize();
        ListIterator<T> it = tokenList.listIterator(tokenList.size());
        for (int seen = 0; it.hasPrevious() && seen < limit; ++seen) {
            hash = hash * HASH_NUM + it.previous().hashCode();
        }
        return hash;
    }

    /**
     * Two n-grams are equal when {@link #compareTo(NGram)} returns 0; objects
     * that are not n-grams are never equal to one.
     */
    @SuppressWarnings("unchecked")
    @Override
    public boolean equals(Object obj) {
        if (this == obj) {
            return true;
        }
        if (obj instanceof NGram) {
            // Unchecked: the element type of the other n-gram cannot be
            // verified at runtime.
            return this.compareTo((NGram<T>) obj) == 0;
        }
        return false;
    }

    /**
     * Compares the two n-grams token by token, starting from the last token
     * and moving backwards, looking at no more than this instance's compare
     * window. The first differing pair of tokens decides the result. If one
     * n-gram runs out of tokens inside the window while the other still has
     * some, the shorter one is ordered first.
     *
     * @param other
     *            the n-gram to compare with
     * @return a negative value, zero or a positive value as this n-gram is
     *         less than, equal to or greater than {@code other}
     */
    @Override
    public int compareTo(NGram<T> other) {
        ListIterator<T> mine = tokenList.listIterator(tokenList.size());
        ListIterator<T> theirs = other.tokenList.listIterator(other.tokenList
                .size());
        final int limit = windowSize();

        for (int seen = 0; seen < limit; ++seen) {
            boolean mineLeft = mine.hasPrevious();
            boolean theirsLeft = theirs.hasPrevious();
            if (mineLeft && theirsLeft) {
                int result = mine.previous().compareTo(theirs.previous());
                if (result != 0) {
                    return result;
                }
            } else if (mineLeft) {
                return 1;
            } else if (theirsLeft) {
                return -1;
            } else {
                // Both n-grams are exhausted without any difference.
                return 0;
            }
        }
        return 0;
    }

    /**
     * Returns the internal token list itself, not a copy. Modifying it would
     * leave the cached hash value out of date.
     */
    @Override
    public List<T> toList() {
        return tokenList;
    }

    /**
     * Returns the last token of the n-gram.
     *
     * @throws IndexOutOfBoundsException
     *             if the n-gram holds no tokens
     */
    @Override
    public T getLast() {
        return tokenList.get(tokenList.size() - 1);
    }

    /** Translates compareLength into a loop bound: -1 becomes "no limit". */
    private int windowSize() {
        return compareLength != -1 ? compareLength : Integer.MAX_VALUE;
    }
}