TexSpellDictionary.java example

Explorer

texlipse-master
- source
  - net
    - sourceforge
      - texlipse
        DDEClient.java
        PathUtils.java
        SelectedResourceManager.java
        TexPerspectiveFactory.java
        TexlipsePlugin.java
        actions
        AbstractTexSelectionChange.java
        ForceRebuildAction.java
        GoToMatchingBracketAction.java
        InputQueryDialog.java
        OpenDeclarationAction.java
        PartialBuildAction.java
        PreviewAction.java
        RunBibTeXOnNextBuildAction.java
        SaveAsTemplateAction.java
        SetMainFileAction.java
        TexCollapseAction.java
        TexComment.java
        TexCorrectIndentationAction.java
        TexHardLineWrapAction.java
        TexInsertMathSymbolAction.java
        TexSelections.java
        TexUncollapseAction.java
        TexUncomment.java
        TexWordWrapAction.java
        WordCountAction.java
        auxparser
        AuxFileParser.java
        bibeditor
        AbbrevManager.java
        BibBraceRule.java
        BibCodeFolder.java
        BibCodeScanner.java
        BibColorProvider.java
        BibCommandRule.java
        BibCompletionProcessor.java
        BibContentProvider.java
        BibDocumentModel.java
        BibEditor.java
        BibEntryScanner.java
        BibLabelProvider.java
        BibOutlinePage.java
        BibPartitionScanner.java
        BibProjectionAnnotation.java
        BibSetupParticipant.java
        BibSourceViewerConfiguration.java
        BibStringCompleter.java
        BibStringRule.java
        bibparser
        AbbrevRetriever.java
        BibFileReferenceSearch.java
        BibLexer.java
        BibOutlineContainer.java
        BibParser.java
        EntryRetriever.java
        analysis
        Analysis.java
        AnalysisAdapter.java
        DepthFirstAdapter.java
        ReversedDepthFirstAdapter.java
        lexer
        Lexer.java
        LexerException.java
        node
        ABibeBibEntry.java
        ABibstreBibEntry.java
        ABibtaskBibEntry.java
        ABibtex.java
        AConcat.java
        AEntryDef.java
        AEntrybraceEntry.java
        AEntryparenEntry.java
        AIdValOrSid.java
        AKeyvalDecl.java
        ANumValOrSid.java
        AStrbraceStringEntry.java
        AStrparenStringEntry.java
        AValueBValOrSid.java
        AValueQValOrSid.java
        EOF.java
        Node.java
        PBibEntry.java
        PBibtex.java
        PConcat.java
        PEntry.java
        PEntryDef.java
        PKeyvalDecl.java
        PStringEntry.java
        PValOrSid.java
        Start.java
        Switch.java
        Switchable.java
        TBString.java
        TComma.java
        TComment.java
        TEntryName.java
        TEquals.java
        TEstring.java
        TIdentifier.java
        TLBrace.java
        TLParen.java
        TNumber.java
        TPreamble.java
        TQuotec.java
        TRBrace.java
        TRParen.java
        TScribeComment.java
        TSharp.java
        TStringLiteral.java
        TTaskcomment.java
        TWhitespace.java
        Token.java
        parser
        Parser.java
        ParserException.java
        State.java
        TokenIndex.java
        builder
        AbstractBuilder.java
        AbstractProgramRunner.java
        AdaptableBuilder.java
        BiberRunner.java
        BibtexRunner.java
        Builder.java
        BuilderChooser.java
        BuilderCoreException.java
        BuilderRegistry.java
        DviBuilder.java
        DvipdfRunner.java
        DvipsRunner.java
        ExternalProgram.java
        Kpath.java
        KpsewhichRunner.java
        LatexRunner.java
        LualatexRunner.java
        MakeindexNomenclRunner.java
        MakeindexRunner.java
        OutputFileManager.java
        OutputScanner.java
        PdflatexRunner.java
        ProgramRunner.java
        ProjectFileTracking.java
        Ps2pdfRunner.java
        PsBuilder.java
        PslatexRunner.java
        TexBuilder.java
        TexlipseBuilder.java
        TexlipseNature.java
        XelatexRunner.java
        editor
        BracketInserter.java
        ColorManager.java
        HardLineWrap.java
        TeXSpellingReconcileStrategy.java
        TexAnnotationHover.java
        TexAutoIndentStrategy.java
        TexCodeFolder.java
        TexCompletionProcessor.java
        TexCompletionProposal.java
        TexDocumentParseException.java
        TexDocumentProvider.java
        TexDocumentSetupParticipant.java
        TexEditor.java
        TexEditorActionContributor.java
        TexEditorTools.java
        TexMathCompletionProcessor.java
        TexPairMatcher.java
        TexProjectionAnnotation.java
        TexQuoteListener.java
        TexSourceViewerConfiguration.java
        TexlipseAnnotationUpdater.java
        hover
        TexHover.java
        TexHoverControlCreator.java
        TexInformationControl.java
        partitioner
        BufferedDocumentScanner.java
        FastLaTeXPartitionScanner.java
        scanner
        TexArgScanner.java
        TexCommentScanner.java
        TexEnvironmentRule.java
        TexMathScanner.java
        TexOptArgScanner.java
        TexScanner.java
        TexSpecialCharRule.java
        TexTikzScanner.java
        TexWord.java
        TextWords.java
        WhitespaceDetector.java
        extension
        BibOutlineActionProvider.java
        BibProvider.java
        model
        AbstractEntry.java
        CommandEntry.java
        DocumentReference.java
        MarkerHandler.java
        OutlineNode.java
        ParseErrorMessage.java
        PartialRetriever.java
        ReferenceContainer.java
        ReferenceEntry.java
        ReferenceManager.java
        TexCommandContainer.java
        TexCommandEntry.java
        TexDocumentModel.java
        TexOutlineInput.java
        TexProjectParser.java
        TexStyleCompletionManager.java
        outline
        TexContentProvider.java
        TexLabelProvider.java
        TexOutlineActionCopy.java
        TexOutlineActionCut.java
        TexOutlineActionDelete.java
        TexOutlineActionPaste.java
        TexOutlineActionUpdate.java
        TexOutlineDNDAdapter.java
        TexOutlineFilter.java
        TexOutlineNodeComparer.java
        TexOutlinePage.java
        TexProjectOutline.java
        properties
        BibColoringPreferencePage.java
        BibDirectoriesPreferencePage.java
        BibtexPreferencePage.java
        BuilderConfigDialog.java
        BuilderEnvPreferencePage.java
        BuilderSettingsPreferencePage.java
        KeyValueListFieldEditor.java
        LatexTempExtsPreferencePage.java
        ProjectTemplatesPreferencePage.java
        StringListFieldEditor.java
        TexlipseHelpIds.java
        TexlipsePreferenceInitializer.java
        TexlipsePreferencePage.java
        TexlipseProjectPropertyPage.java
        TexlipseProperties.java
        ViewerEnvPreferencePage.java
        ViewerListFieldEditor.java
        ViewerSettingsPreferencePage.java
        editor
        CodeFoldingPreferencePage.java
        ColoringPreferencePage.java
        IndentationPreferencePage.java
        OutlinePreferencePage.java
        SmartKeyPreferencePage.java
        StyleCompletionPreferencePage.java
        StyleListFieldEditor.java
        TexEditorPreferencePage.java
        spelling
        AddToDictProposal.java
        IgnoreProposal.java
        SpellCheckAction.java
        SpellChecker.java
        SpellCheckerEnvPreferencePage.java
        SpellCheckerPreferencePage.java
        SpellUncheckAction.java
        SpellingCompletionProposal.java
        SpellingMarkerResolution.java
        SpellingResolutionGenerator.java
        TexSpellDictionary.java
        TexSpellingEngine.java
        TexlipseWordFinder.java
        tableview
        views
        ITexRowListViewer.java
        TexCellListener.java
        TexCellModifier.java
        TexRow.java
        TexRowList.java
        TexTableView.java
        templates
        BibTexContextType.java
        BibTexTemplateCompletion.java
        BibTexTemplatePreferencesPage.java
        CompletionProposalComparator.java
        ProjectTemplateManager.java
        ProposalsComparator.java
        TexContextType.java
        TexTemplateCompletion.java
        TexTemplatePreferencesPage.java
        texparser
        LatexLexer.java
        LatexParser.java
        LatexParserUtils.java
        LatexRefExtractingParser.java
        LatexWordCounter.java
        TexParser.java
        analysis
        Analysis.java
        AnalysisAdapter.java
        lexer
        Lexer.java
        LexerException.java
        node
        EOF.java
        Node.java
        Switch.java
        Switchable.java
        TArgument.java
        TBverbatim.java
        TCbegin.java
        TCbib.java
        TCbibstyle.java
        TCchapter.java
        TCcite.java
        TCend.java
        TCinclude.java
        TCinput.java
        TClabel.java
        TCnew.java
        TCommentline.java
        TCpackage.java
        TCparagraph.java
        TCpart.java
        TCpbib.java
        TCpindex.java
        TCref.java
        TCrenew.java
        TCsection.java
        TCspace.java
        TCssection.java
        TCsssection.java
        TCsymbol.java
        TCverb.java
        TCword.java
        TEverbatim.java
        TLBrace.java
        TLBracket.java
        TOptargument.java
        TRBrace.java
        TRBracket.java
        TSkippedArea.java
        TStar.java
        TTaskcomment.java
        TVtext.java
        TWhitespace.java
        TWord.java
        Token.java
        treeview
        views
        TexOutlineTreeView.java
        ui
        KpathseaProvider.java
        viewer
        TexLaunchConfigurationDelegate.java
        TexLaunchConfigurationTab.java
        TexLaunchConfigurationTabGroup.java
        ViewerAttributeRegistry.java
        ViewerConfigDialog.java
        ViewerManager.java
        ViewerOutputScanner.java
        util
        FileLocationClient.java
        FileLocationListener.java
        FileLocationServer.java
        ViewerErrorScanner.java
        wizards
        TexlipseNewTexFileWizard.java
        TexlipseNewTexFileWizardPage.java
        TexlipseProjectAttributes.java
        TexlipseProjectCreationOperation.java
        TexlipseProjectCreationWizard.java
        TexlipseProjectCreationWizardPage.java
        TexlipseProjectFilesWizardPage.java
        TexlipseWizardPage.java

/*
 * $Id$
 *
 * Copyright (c) 2004-2010 by the TeXlapse Team.
 * All rights reserved. This program and the accompanying materials
 * are made available under the terms of the Eclipse Public License v1.0
 * which accompanies this distribution, and is available at
 * http://www.eclipse.org/legal/epl-v10.html
 */
package net.sourceforge.texlipse.spelling;

import java.io.BufferedReader;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.IOException;
import java.io.Reader;
import java.io.Writer;
import java.util.ArrayList;
import java.util.Collection;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.StringTokenizer;

import com.swabunga.spell.engine.SpellDictionaryASpell;

/**
 * A memory optimized dictionary class.
 * <p>
 * Words are grouped into buckets keyed by the {@code hashCode()} of their
 * phonetic code (as returned by {@code getCode(String)}). Each bucket is a
 * single {@link StringBuilder} of the form {@code ;word1;word2;...;}, i.e.
 * every word is delimited on both sides by {@link #SEP_CHAR}.
 * <p>
 * Because the map key is the hash of the phonetic code rather than the code
 * itself, two different codes with the same hash value share one bucket.
 * <p>
 * This class performs no synchronization of its own.
 *
 * @author Boris von Loesch
 */
public class TexSpellDictionary extends SpellDictionaryASpell {
    private final static int INITIAL_CAPACITY = 32 * 1024;

    /** Delimiter placed before and after every word inside a bucket. */
    private final static char SEP_CHAR = ';';

    /** Buckets of words, keyed by the hash code of the phonetic code. */
    protected Map<Integer, StringBuilder> mainDictionary = new HashMap<Integer, StringBuilder>(INITIAL_CAPACITY);

    /**
     * User dictionary file that {@link #addWord(String)} appends to;
     * {@code null} if no user dictionary has been set.
     */
    private File dictFile = null;


    /**
     * Dictionary Constructor.
     * @param wordList The reader providing the word list for the dictionary,
     * one word per line. The reader is not closed by this constructor.
     * @throws java.io.IOException indicates problems reading the words list
     */
    public TexSpellDictionary(Reader wordList) throws IOException {
        super((File) null);
        createDictionary(new BufferedReader(wordList));
    }

    /**
     * Dictionary constructor that uses an aspell phonetic file to
     * build the transformation table.
     * @param wordList The reader providing the word list for the dictionary,
     * one word per line. The reader is not closed by this constructor.
     * @param phonetic The reader to use for phonetic transformation of the
     * wordlist.
     * @throws java.io.IOException indicates problems reading the words list
     * or phonetic information
     */
    public TexSpellDictionary(Reader wordList, Reader phonetic) throws IOException {
        super(phonetic);
        createDictionary(new BufferedReader(wordList));
    }

    /**
     * Add words from a file to the existing dictionary.
     * This function can be called as many times as needed to
     * build the internal word list. Duplicates are not added.
     * <p>
     * Note that adding a dictionary does not affect the target
     * file of {@link #addWord(String)}; that file is only changed by
     * {@link #setUserDict(File)}.
     * <p>
     * The file is closed again before this method returns, also when reading
     * fails.
     *
     * @param wordList a File object that contains the words, one word per line.
     * @throws FileNotFoundException if the file cannot be opened for reading
     * @throws IOException if reading the file fails
     */
    public void addDictionary(File wordList) throws FileNotFoundException, IOException {
        BufferedReader in = new BufferedReader(new FileReader(wordList));
        try {
            addDictionaryHelper(in);
        } finally {
            in.close();
        }
    }

    /**
     * Set the user dictionary file and load the words it already contains.
     * <p>
     * Loading is best effort: if the file cannot be read (for example because
     * it does not exist yet) the dictionary is left as it is and the file is
     * still remembered as the target for {@link #addWord(String)}.
     *
     * @param userDict the user dictionary file; {@code null} removes the
     * current user dictionary file without loading anything
     */
    public void setUserDict(File userDict) {
        dictFile = userDict;
        if (userDict == null) {
            // Nothing to load; opening a null file would throw a NullPointerException.
            return;
        }
        try {
            addDictionary(userDict);
        } catch (IOException e) {
            // Intentionally ignored: a missing or unreadable user dictionary
            // is not an error, addWord() creates the file on demand.
        }
    }

    /**
     * Add a word permanently to the dictionary (and the dictionary file).
     * <p>
     * The word is always added to the in-memory dictionary. If a user
     * dictionary file has been set, the word is additionally appended to that
     * file on its own line; the file is created if it does not exist. Failures
     * while writing the file are ignored.
     * <p>This needs to be made thread safe (synchronized)</p>
     *
     * @param word The word to add
     */
    public void addWord(String word) {
        putWordUnique(word);
        if (dictFile == null) return;
        try {
            if (!dictFile.exists()) {
                boolean succ = dictFile.createNewFile();
                if (!succ) return;
            }
            // Open with append.
            Writer w = new FileWriter(dictFile.toString(), true);
            try {
                w.write(word);
                w.write("\n");
            } finally {
                // Release the file handle even if writing failed.
                w.close();
            }
        } catch (IOException ex) {
            // Intentionally ignored: the word stays available in memory for
            // this session even if it could not be persisted.
        }
    }

    /**
     * Constructs the dictionary from a word list.
     * <p>
     * Each word in the reader should be on a separate line. Lines are trimmed;
     * lines that are empty after trimming are skipped. Words are added without
     * checking for duplicates.
     *
     * @param in the reader providing the word list; not closed by this method
     * @throws IOException if reading fails
     */
    protected void createDictionary(BufferedReader in) throws IOException {
        String line;
        while ((line = in.readLine()) != null) {
            // Trim before the emptiness check so that whitespace-only lines
            // do not end up as an empty word in the dictionary.
            String word = line.trim();
            if (word.length() > 0) {
                putWord(word);
            }
        }
    }

    /**
     * Adds to the existing dictionary from a word list. If the word
     * already exists in the dictionary, a new entry is not added.
     * <p>
     * Each word in the reader should be on a separate line. Lines are trimmed;
     * lines that are empty after trimming are skipped.
     *
     * @param in the reader providing the word list; not closed by this method
     * @throws IOException if reading fails
     */
    public void addDictionaryHelper(BufferedReader in) throws IOException {
        String line;
        while ((line = in.readLine()) != null) {
            // Trim before the emptiness check so that whitespace-only lines
            // do not end up as an empty word in the dictionary.
            String word = line.trim();
            if (word.length() > 0) {
                putWordUnique(word);
            }
        }
    }

    /**
     * Allocates a word in the dictionary without checking whether it is
     * already present.
     * @param word The word to add
     */
    protected void putWord(String word) {
        int code = getCode(word).hashCode();
        StringBuilder words = mainDictionary.get(code);
        if (words != null) {
            appendWord(words, word);
        } else {
            mainDictionary.put(code, newBucket(word));
        }
    }

    /**
     * Allocates a word, if it is not already present in the dictionary.
     * The comparison is case-sensitive: a word that differs only in case from
     * an existing entry is added as a separate entry.
     * @param word The word to add
     */
    protected void putWordUnique(String word) {
        int code = getCode(word).hashCode();
        StringBuilder words = mainDictionary.get(code);
        if (words == null) {
            mainDictionary.put(code, newBucket(word));
        } else if (!containsWord(words, word)) {
            appendWord(words, word);
        }
        //else the word is already in the dictionary
    }

    /**
     * Compresses the dictionary so that it takes less memory, by trimming
     * the capacity of every bucket to its current length.
     */
    public void compress() {
        Collection<StringBuilder> c = mainDictionary.values();
        for (StringBuilder st : c) {
            st.trimToSize();
        }
    }

    /**
     * Returns a list of strings (words) for the code.
     * <p>
     * The result contains every word stored in the bucket for
     * {@code code.hashCode()}.
     *
     * @param code the phonetic code to look up
     * @return a new list with the words of the matching bucket; empty if
     * there is no such bucket
     */
    @Override
    public List<String> getWords(String code) {
        List<String> list = new ArrayList<String>(1);
        //Check the main dictionary.
        StringBuilder mainDictResult = mainDictionary.get(code.hashCode());
        if (mainDictResult == null) return list;
        StringTokenizer stk = new StringTokenizer(mainDictResult.toString(), String.valueOf(SEP_CHAR));
        while (stk.hasMoreTokens()) list.add(stk.nextToken());
        return list;
    }

    /**
     * Returns true if the word is correctly spelled against the current word list.
     * <p>
     * The word is looked up as given and, if that fails, in its lowercase
     * form. Both lookups use the bucket selected by the phonetic code of the
     * word as given.
     *
     * @param word the word to check
     * @return {@code true} if the word or its lowercase form is in the bucket
     */
    @Override
    public boolean isCorrect(String word) {
        StringBuilder words = mainDictionary.get(getCode(word).hashCode());
        if (words == null) return false;
        if (containsWord(words, word)) return true;
        //JMH should we always try the lowercase version. If I dont then capitalised
        //words are always returned as incorrect.
        return containsWord(words, word.toLowerCase());
    }

    /**
     * Creates a new bucket holding exactly the given word.
     */
    private static StringBuilder newBucket(String word) {
        StringBuilder words = new StringBuilder();
        words.append(SEP_CHAR);
        appendWord(words, word);
        return words;
    }

    /**
     * Appends the word followed by the separator to an existing bucket.
     */
    private static void appendWord(StringBuilder words, String word) {
        words.append(word);
        words.append(SEP_CHAR);
    }

    /**
     * Tells whether the bucket contains the word, delimited by separators on
     * both sides (exact, case-sensitive match).
     */
    private static boolean containsWord(StringBuilder words, String word) {
        return words.indexOf(SEP_CHAR + word + SEP_CHAR) >= 0;
    }

}