package edu.northwestern.at.morphadorner.tools.taggertrainer; /* Please see the license information at the end of this file. */ import java.util.*; import edu.northwestern.at.morphadorner.tools.taggertrainer.*; import edu.northwestern.at.utils.*; /** Tag confusion matrix entry. * * <p> * A TagError entry contains a (correct tag, incorrect tag, error count) * tuple. The error count is the number of times a part of speech * tagger generated "incorrect tag" instead of "correct tag" in * a tagged corpus. A list of TagError entries can be used by a * transformation based learning program to generate contextual rules * to correct the tag errors. * </p> */ public class TagError implements Comparable { /** Correct tag. */ public final String correctTag; /** Incorrect tag. */ public final String incorrectTag; /** List of word positions where this error occurs. */ public final List<Integer> errorPositions; /** Number of times incorrect tag appears instead of correct tag. */ public final int incorrectTagCount; /** The hash code. */ protected final int hashCode; /** Create a tag error entry. * * @param correctTag The correct part of speech tag. * @param incorrectTag The incorrect part of speech tag. * @param errorPositions The list of tag error positions. */ public TagError ( String correctTag , String incorrectTag , List<Integer> errorPositions ) { this.correctTag = correctTag; this.incorrectTag = incorrectTag; this.errorPositions = errorPositions; this.incorrectTagCount = this.errorPositions.size(); // Compute hash code. this.hashCode = this.correctTag.hashCode() ^ this.incorrectTag.hashCode() ^ (new Integer( incorrectTagCount )).hashCode(); } /** Check if another object is equal to this one. * * @param object Other object to test for equality. * * @return true if other object is equal to this one. */ public boolean equals( Object object ) { boolean result = false; if ( ( object != null ) && ( object instanceof TagError ) ) { TagError otherTagError = (TagError)object; result = ( correctTag.equals( otherTagError.correctTag ) ) && ( incorrectTag.equals( otherTagError.incorrectTag ) ) && ( incorrectTagCount == otherTagError.incorrectTagCount ); } return result; } /** Compare this object with another. * * @param object The other object. * * @return < 0 if the other object is less than this one, * = 0 if the two objects are equal, * > 0 if the other object is greater than this one. * * <p> * We use compareTo on the array entries in the key. * This may not give the desired result if the array entries * are themselves arrays. * </p> */ public int compareTo( Object object ) { int result = 0; if ( ( object == null ) || !( object instanceof TagError ) ) { result = Integer.MIN_VALUE; } else { TagError otherTagError = (TagError)object; if ( incorrectTagCount > otherTagError.incorrectTagCount ) { result = -1; } else if ( incorrectTagCount < otherTagError.incorrectTagCount ) { result = 1; } if ( result == 0 ) { result = Compare.compare( incorrectTag , otherTagError.incorrectTag ); } if ( result == 0 ) { result = Compare.compare( correctTag , otherTagError.correctTag ); } } return result; } /** Get the hash code of the keys. * * @return The hash code. */ public int hashCode() { return hashCode; } /** Return a string representation of this object. * * @return A string representation of this object. */ public String toString() { return incorrectTagCount + " " + incorrectTag + " should be " + correctTag; } } /* Copyright (c) 2008, 2009 by Northwestern University. All rights reserved. Developed by: Academic and Research Technologies Northwestern University http://www.it.northwestern.edu/about/departments/at/ Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal with the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimers. * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimers in the documentation and/or other materials provided with the distribution. * Neither the names of Academic and Research Technologies, Northwestern University, nor the names of its contributors may be used to endorse or promote products derived from this Software without specific prior written permission. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS WITH THE SOFTWARE. */