TrialUndoParser.java example

Explorer
cdt-tests-runner-master
/*******************************************************************************
 * Copyright (c) 2006, 2008 IBM Corporation and others.
 * All rights reserved. This program and the accompanying materials
 * are made available under the terms of the Eclipse Public License v1.0
 * which accompanies this distribution, and is available at
 * http://www.eclipse.org/legal/epl-v10.html
 *
 * Contributors:
 *     IBM Corporation - initial API and implementation
 *******************************************************************************/
package org.eclipse.cdt.core.dom.lrparser.lpgextensions;

import java.util.LinkedList;

import lpg.lpgjavaruntime.BadParseException;
import lpg.lpgjavaruntime.BadParseSymFileException;
import lpg.lpgjavaruntime.ConfigurationElement;
import lpg.lpgjavaruntime.ConfigurationStack;
import lpg.lpgjavaruntime.Monitor;
import lpg.lpgjavaruntime.NotBacktrackParseTableException;
import lpg.lpgjavaruntime.ParseTable;
import lpg.lpgjavaruntime.TokenStream;

public class TrialUndoParser {
	private Monitor monitor = null;
	private int START_STATE, NUM_RULES, LA_STATE_OFFSET, EOFT_SYMBOL, ERROR_SYMBOL, ACCEPT_ACTION, ERROR_ACTION;

	private TokenStream tokStream;
	private ParseTable prs;
	private ITrialUndoActionProvider actionProvider;
	private boolean skipTokens = false; // true if error productions are used to
										// skip tokens

	private ParserState state;

	/**
	 * Signals that a backtrack was requested by a trial action.
	 */
	private boolean backtrackRequested;

	//
	// Override the getToken function in Stacks.
	//
	public final int getToken(int i) {
		return state.tokens.get(state.parserLocationStack[state.stateStackTop + (i - 1)]);
	}

	public int getTokenOffset() {
		return state.parserLocationStack[state.stateStackTop];
	}

	public final int getCurrentRule() {
		return state.currentAction;
	}

	public final int getFirstToken() {
		return tokStream.getFirstErrorToken(getToken(1));
	}

	public final int getFirstToken(int i) {
		return tokStream.getFirstErrorToken(getToken(i));
	}

	public final int getLastToken() {
		return tokStream.getLastErrorToken(state.lastToken);
	}

	public final int getLastToken(int i) {
		int l = (i >= prs.rhs(state.currentAction) ? state.lastToken : state.tokens.get(state.locationStack[state.stateStackTop + i] - 1));
		return tokStream.getLastErrorToken(l);
	}

	public TrialUndoParser(TokenStream tokStream, ParseTable prs, ITrialUndoActionProvider ra) throws BadParseSymFileException, NotBacktrackParseTableException {
		this.tokStream = tokStream;
		this.prs = prs;
		this.actionProvider = ra;

		START_STATE = prs.getStartState();
		NUM_RULES = prs.getNumRules();
		LA_STATE_OFFSET = prs.getLaStateOffset();
		EOFT_SYMBOL = prs.getEoftSymbol();
		ERROR_SYMBOL = prs.getErrorSymbol();
		ACCEPT_ACTION = prs.getAcceptAction();
		ERROR_ACTION = prs.getErrorAction();

		if (!prs.isValidForParser())
			throw new BadParseSymFileException();
		if (!prs.getBacktrack())
			throw new NotBacktrackParseTableException();
	}

	public TrialUndoParser(Monitor monitor, TokenStream tokStream, ParseTable prs, ITrialUndoActionProvider ra) throws BadParseSymFileException, NotBacktrackParseTableException {
		this(tokStream, prs, ra);
		this.monitor = monitor;
	}

	//
	// Parse without attempting any Error token recovery
	//
	public Object parse() throws BadParseException {
		// without an argument parse() will ignore error productions
		return parse(0);
	}

	//
	// Parse input allowing up to max_error_count Error token recoveries.
	// When max_error_count is 0, no Error token recoveries occur.
	// When max_error is > 0, it limits the number of Error token recoveries.
	// When max_error is < 0, the number of error token recoveries is unlimited.
	// Also, such recoveries only require one token to be parsed beyond the
	// recovery point.
	// (normally two tokens beyond the recovery point must be parsed)
	// Thus, a negative max_error_count should be used when error productions
	// are used to
	// skip tokens.
	//
	public Object parse(int max_error_count) throws BadParseException {
		state = new ParserState(START_STATE, tokStream);
		skipTokens = max_error_count < 0;

		state.pendingCommits = new LinkedList();
		backtrackRequested = false;
		state.trialActionCount = 0;

		// Next "start" token
		state.repair_token = 0;

		int start_token_index = tokStream.peek();
		int start_action_index = 0;

		// Last commit point
		int[] temp_stack = new int[1];
		temp_stack[0] = START_STATE;

		state.reallocateOtherStacks(start_token_index);

		int initial_error_token = backtrackParse(state.repair_token);
		for (int error_token = initial_error_token, count = 0; error_token != 0; error_token = backtrackParse(state.repair_token), count++) {
			if (count == max_error_count)
				throw new BadParseException(initial_error_token);
			state.actionCount = start_action_index;
			tokStream.reset(start_token_index);
			state.stateStackTop = temp_stack.length - 1;
			System.arraycopy(temp_stack, 0, state.stateStack, 0, temp_stack.length);
			state.reallocateOtherStacks(start_token_index);

			backtrackParseUpToError(state.repair_token, error_token);

			for (state.stateStackTop = findRecoveryStateIndex(state.stateStackTop); state.stateStackTop >= 0; state.stateStackTop = findRecoveryStateIndex(state.stateStackTop - 1)) {
				int recovery_token = state.tokens.get(state.locationStack[state.stateStackTop] - 1);
				state.repair_token = errorRepair((recovery_token >= start_token_index ? recovery_token : error_token), error_token);
				if (state.repair_token != 0)
					break;
			}

			if (state.stateStackTop < 0)
				throw new BadParseException(initial_error_token);

			temp_stack = new int[state.stateStackTop + 1];
			System.arraycopy(state.stateStack, 0, temp_stack, 0, temp_stack.length);

			start_action_index = state.actionCount;
			start_token_index = tokStream.peek();
		}

		if (state.repair_token != 0)
			state.tokens.add(state.repair_token);
		int t;
		for (t = start_token_index; tokStream.getKind(t) != EOFT_SYMBOL; t = tokStream.getNext(t))
			state.tokens.add(t);
		state.tokens.add(t);

		return null;
	}

	//
	// Process reductions and continue...
	//
	private int process_backtrack_reductions(int act) {
		do {
			state.stateStackTop -= (prs.rhs(act) - 1);
			trialAction(act);
			if (backtrackRequested) {
				backtrackRequested = false;
				return ERROR_ACTION;
			}
			act = prs.ntAction(state.stateStack[state.stateStackTop], prs.lhs(act));
		} while (act <= NUM_RULES);
		return act;
	}

	//
	// Process reductions and continue...
	//
	private int process_repair_reductions(int act) {
		do {
			System.out.println("process_repair_reductions: " + act);
			state.stateStackTop -= (prs.rhs(act) - 1);
			act = prs.ntAction(state.stateStack[state.stateStackTop], prs.lhs(act));
		} while (act <= NUM_RULES);
		return act;
	}

	//
	// Parse the input until either the parse completes successfully or
	// an error is encountered. This function returns an integer that
	// represents the last action that was executed by the parser. If
	// the parse was succesful, then the tuple "action" contains the
	// successful sequence of actions that was executed.
	//
	private int backtrackParse(int initial_token) {
		//
		// Allocate configuration stack.
		//
		state.configurationStack = new ConfigurationStack(prs);
		state.trialActionStack = new LinkedList<Integer>();
		state.trialActionStack.add(Integer.valueOf(state.trialActionCount));

		//
		// Keep parsing until we successfully reach the end of file or
		// an error is encountered. The list of actions executed will
		// be stored in the "action" tuple.
		//
		int error_token = 0;
		int maxStackTop = state.stateStackTop;
		int start_token = tokStream.peek();
		state.curtok = (initial_token > 0 ? initial_token : tokStream.getToken());
		int current_kind = tokStream.getKind(state.curtok);
		state.act = tAction(state.stateStack[state.stateStackTop], current_kind);

		//
		// The main driver loop
		//
		for (;;) {
			//
			// if the parser needs to stop processing,
			// it may do so here.
			//
			if (monitor != null && monitor.isCancelled())
				return 0;

			state.parserLocationStack[state.stateStackTop] = state.curtok;

			if (state.act <= NUM_RULES) {
				state.actionCount++;
				state.stateStackTop--;
				state.act = process_backtrack_reductions(state.act);
			} else if (state.act > ERROR_ACTION) {
				state.actionCount++;
				state.lastToken = state.curtok;
				state.curtok = tokStream.getToken();
				current_kind = tokStream.getKind(state.curtok);
				state.act = process_backtrack_reductions(state.act - ERROR_ACTION);
			} else if (state.act < ACCEPT_ACTION) {
				state.actionCount++;
				state.lastToken = state.curtok;
				state.curtok = tokStream.getToken();
				current_kind = tokStream.getKind(state.curtok);
			}

			if (state.act == ERROR_ACTION) {
				error_token = (error_token > state.curtok ? error_token : state.curtok);

				ConfigurationElement configuration = state.configurationStack.pop();
				if (configuration == null)
					state.act = ERROR_ACTION;
				else {
					boolean shouldPop = prs.baseAction(configuration.conflict_index) == 0;
					undoActions(shouldPop);
					state.actionCount = configuration.action_length;
					state.act = configuration.act;
					state.curtok = configuration.curtok;
					current_kind = tokStream.getKind(state.curtok);
					tokStream.reset(state.curtok == initial_token ? start_token : tokStream.getNext(state.curtok));
					state.stateStackTop = configuration.stack_top;
					configuration.retrieveStack(state.stateStack);
					continue;
				}
				break;
			}
			if (state.act > ACCEPT_ACTION && state.act != ERROR_ACTION) {
				if (state.configurationStack.findConfiguration(state.stateStack, state.stateStackTop, state.curtok))
					state.act = ERROR_ACTION;
				else {
					state.configurationStack.push(state.stateStack, state.stateStackTop, state.act + 1, state.curtok, state.actionCount);
					state.trialActionStack.add(Integer.valueOf(state.trialActionCount));
					state.act = prs.baseAction(state.act);
					maxStackTop = state.stateStackTop > maxStackTop ? state.stateStackTop : maxStackTop;
				}
				continue;
			} else if (state.act == ACCEPT_ACTION) {
				break;
			}
			try {
				state.stateStack[++state.stateStackTop] = state.act;
			} catch (IndexOutOfBoundsException e) {
				state.reallocateStateStack();
				state.stateStack[state.stateStackTop] = state.act;
			}

			state.act = tAction(state.act, current_kind);
		}

		// System.out.println("****Number of configurations: " +
		// configuration_stack.configurationSize());
		// System.out.println("****Number of elements in stack tree: " +
		// configuration_stack.numStateElements());
		// System.out.println("****Number of elements in stacks: " +
		// configuration_stack.stacksSize());
		// System.out.println("****Number of actions: " + action.size());
		// System.out.println("****Max Stack Size = " + maxStackTop);
		// System.out.flush();
		return (state.act == ERROR_ACTION ? error_token : 0);
	}

	private void backtrackParseUpToError(int initial_token, int error_token) {
		//
		// Allocate configuration stack.
		//
		state.configurationStack = new ConfigurationStack(prs);
		state.trialActionStack = new LinkedList<Integer>();
		state.trialActionStack.add(Integer.valueOf(state.trialActionCount));

		//
		// Keep parsing until we successfully reach the end of file or
		// an error is encountered. The list of actions executed will
		// be stored in the "action" tuple.
		//

		// tokStream.reset(initial_token);
		int start_token = tokStream.peek();
		state.curtok = (initial_token > 0 ? initial_token : tokStream.getToken());
		int current_kind = tokStream.getKind(state.curtok);
		state.act = tAction(state.stateStack[state.stateStackTop], current_kind);

		state.tokens.add(state.curtok);
		state.locationStack[state.stateStackTop] = state.tokens.size();
		state.actionStack[state.stateStackTop] = state.actionCount;
		state.undoStack[state.stateStackTop] = state.trialActionCount;

		for (;;) {
			//
			// if the parser needs to stop processing,
			// it may do so here.
			//
			if (monitor != null && monitor.isCancelled())
				return;

			state.parserLocationStack[state.stateStackTop] = state.curtok;

			if (state.act <= NUM_RULES) {
				state.actionCount++;
				state.stateStackTop--;
				state.act = process_backtrack_reductions(state.act);
			} else if (state.act > ERROR_ACTION) {
				state.actionCount++;
				state.lastToken = state.curtok;
				state.curtok = tokStream.getToken();
				current_kind = tokStream.getKind(state.curtok);
				state.tokens.add(state.curtok);
				state.act = process_backtrack_reductions(state.act - ERROR_ACTION);
			} else if (state.act < ACCEPT_ACTION) {
				state.actionCount++;
				state.lastToken = state.curtok;
				state.curtok = tokStream.getToken();
				current_kind = tokStream.getKind(state.curtok);
				state.tokens.add(state.curtok);
			} else if (state.act == ERROR_ACTION) {
				if (state.curtok != error_token) {
					ConfigurationElement configuration = state.configurationStack.pop();
					if (configuration == null)
						state.act = ERROR_ACTION;
					else {
						boolean shouldPop = prs.baseAction(configuration.conflict_index) == 0;
						undoActions(shouldPop);
						state.actionCount = configuration.action_length;
						state.act = configuration.act;
						int next_token_index = configuration.curtok;
						state.tokens.reset(next_token_index);
						state.curtok = state.tokens.get(next_token_index - 1);
						current_kind = tokStream.getKind(state.curtok);
						tokStream.reset(state.curtok == initial_token ? start_token : tokStream.getNext(state.curtok));
						state.stateStackTop = configuration.stack_top;
						configuration.retrieveStack(state.stateStack);
						state.locationStack[state.stateStackTop] = state.tokens.size();
						state.actionStack[state.stateStackTop] = state.actionCount;
						state.undoStack[state.stateStackTop] = state.trialActionCount;
						continue;
					}
				}
				break;
			} else if (state.act > ACCEPT_ACTION) {
				if (state.configurationStack.findConfiguration(state.stateStack, state.stateStackTop, state.tokens.size()))
					state.act = ERROR_ACTION;
				else {
					state.configurationStack.push(state.stateStack, state.stateStackTop, state.act + 1, state.tokens.size(), state.actionCount);
					state.trialActionStack.add(Integer.valueOf(state.trialActionCount));
					state.act = prs.baseAction(state.act);
				}
				continue;
			} else
				break; // assert(act == ACCEPT_ACTION);

			state.stateStack[++state.stateStackTop] = state.act; // no need
																	// to check
																	// if out of
																	// bounds
			state.locationStack[state.stateStackTop] = state.tokens.size();
			state.actionStack[state.stateStackTop] = state.actionCount;
			state.undoStack[state.stateStackTop] = state.trialActionCount;
			state.act = tAction(state.act, current_kind);
		}

		// assert(curtok == error_token);

		return;
	}

	private boolean repairable(int error_token) {
		//
		// Allocate configuration stack.
		//
		ConfigurationStack configuration_stack = new ConfigurationStack(prs);

		//
		// Keep parsing until we successfully reach the end of file or
		// an error is encountered. The list of actions executed will
		// be stored in the "action" tuple.
		//
		int start_token = tokStream.peek();
		int final_token = tokStream.getStreamLength(); // unreachable
		int curtok = 0;
		int current_kind = ERROR_SYMBOL;
		int act = tAction(state.stateStack[state.stateStackTop], current_kind);

		for (;;) {
			if (act <= NUM_RULES) {
				state.stateStackTop--;
				act = process_repair_reductions(act);
			} else if (act > ERROR_ACTION) {
				curtok = tokStream.getToken();
				if (curtok > final_token)
					return true;
				current_kind = tokStream.getKind(curtok);
				act = process_repair_reductions(act - ERROR_ACTION);
			} else if (act < ACCEPT_ACTION) {
				curtok = tokStream.getToken();
				if (curtok > final_token)
					return true;
				current_kind = tokStream.getKind(curtok);
			} else if (act == ERROR_ACTION) {
				ConfigurationElement configuration = configuration_stack.pop();
				if (configuration == null)
					act = ERROR_ACTION;
				else {
					state.stateStackTop = configuration.stack_top;
					configuration.retrieveStack(state.stateStack);
					act = configuration.act;
					curtok = configuration.curtok;
					if (curtok == 0) {
						current_kind = ERROR_SYMBOL;
						tokStream.reset(start_token);
					} else {
						current_kind = tokStream.getKind(curtok);
						tokStream.reset(tokStream.getNext(curtok));
					}
					continue;
				}
				break;
			} else if (act > ACCEPT_ACTION) {
				if (configuration_stack.findConfiguration(state.stateStack, state.stateStackTop, curtok))
					act = ERROR_ACTION;
				else {
					configuration_stack.push(state.stateStack, state.stateStackTop, act + 1, curtok, 0);
					act = prs.baseAction(act);
				}
				continue;
			} else
				break; // assert(act == ACCEPT_ACTION);
			try {
				//
				// We consider a configuration to be acceptable for recovery
				// if we are able to consume enough symbols in the remaining
				// tokens to reach another potential recovery point past the
				// original error token.
				//
				if ((curtok > error_token) && (final_token == tokStream.getStreamLength())) {
					//
					// If the ERROR_SYMBOL is a valid Action Adjunct in the
					// state
					// "act" then we set the terminating token as the successor
					// of
					// the current token. I.e., we have to be able to parse at
					// least
					// two tokens past the re-synch point before we claim
					// victory.
					//
					if (recoverableState(act))
						final_token = skipTokens ? curtok : tokStream.getNext(curtok);
				}

				state.stateStack[++state.stateStackTop] = act;
			} catch (IndexOutOfBoundsException e) {
				state.reallocateStateStack();
				state.stateStack[state.stateStackTop] = act;
			}

			act = tAction(act, current_kind);
		}

		//
		// If we can reach the end of the input successfully, we claim victory.
		//
		return (act == ACCEPT_ACTION);
	}

	private boolean recoverableState(int state) {
		for (int k = prs.asi(state); prs.asr(k) != 0; k++) {
			if (prs.asr(k) == ERROR_SYMBOL)
				return true;
		}
		return false;
	}

	private int findRecoveryStateIndex(int start_index) {
		int i;
		for (i = start_index; i >= 0; i--) {
			//
			// If the ERROR_SYMBOL is an Action Adjunct in state stateStack[i]
			// then chose i as the index of the state to recover on.
			//
			if (recoverableState(state.stateStack[i]))
				break;
		}

		if (i >= 0) // if a recoverable state, remove null reductions, if any.
		{
			int k;
			for (k = i - 1; k >= 0; k--) {
				if (state.locationStack[k] != state.locationStack[i])
					break;
			}
			i = k + 1;
		}

		return i;
	}

	private int errorRepair(int recovery_token, int error_token) {
		int temp_stack[] = new int[state.stateStackTop + 1];
		System.arraycopy(state.stateStack, 0, temp_stack, 0, temp_stack.length);
		for (; tokStream.getKind(recovery_token) != EOFT_SYMBOL; recovery_token = tokStream.getNext(recovery_token)) { 
			System.out.println("recovery token: " + tokStream.getKind(recovery_token)); //$NON-NLS-1$
			tokStream.reset(recovery_token);
			if (repairable(error_token))
				break;
			state.stateStackTop = temp_stack.length - 1;
			System.arraycopy(temp_stack, 0, state.stateStack, 0, temp_stack.length);
		}

		if (tokStream.getKind(recovery_token) == EOFT_SYMBOL) {
			tokStream.reset(recovery_token);
			if (!repairable(error_token)) {
				state.stateStackTop = temp_stack.length - 1;
				System.arraycopy(temp_stack, 0, state.stateStack, 0, temp_stack.length);
				return 0;
			}
		}

		state.stateStackTop = temp_stack.length - 1;
		System.arraycopy(temp_stack, 0, state.stateStack, 0, temp_stack.length);

		undoActions(state.undoStack[state.stateStackTop]);
		tokStream.reset(recovery_token);
		state.tokens.reset(state.locationStack[state.stateStackTop] - 1);
		state.actionCount = state.actionStack[state.stateStackTop];
		state.trialActionCount = state.undoStack[state.stateStackTop];

		return tokStream.makeErrorToken(state.tokens.get(state.locationStack[state.stateStackTop] - 1), tokStream.getPrevious(recovery_token), error_token, ERROR_SYMBOL);
	}

	private int tAction(int act, int sym) {
		act = prs.tAction(act, sym);
		if (act > LA_STATE_OFFSET) {
			int next_token = tokStream.peek();
			act = prs.lookAhead(act - LA_STATE_OFFSET, tokStream.getKind(next_token));
			while (act > LA_STATE_OFFSET) {
				next_token = tokStream.getNext(next_token);
				act = prs.lookAhead(act - LA_STATE_OFFSET, tokStream.getKind(next_token));
			}
		}
		return act;
	}

	private void trialAction(int action) {
		int start = getTokenOffset();
		int end = getLastToken();
		Rule rule = new Rule(action, start, end);

		actionProvider.setActiveRule(rule);
		boolean saveAction = actionProvider.trialAction(action);
		if (backtrackRequested) {
			return;
		}
		if (saveAction) {
			state.trialActionCount++;
			state.pendingCommits.add(rule);
		}
	}

	/**
	 * Performs the undo actions (in reverse order) for the corresponding trial
	 * actions that have been executed since the last backtrackable point.
	 */
	private void undoActions(boolean shouldPop) {
		int oldTrialActionCount;
		if (state.trialActionStack.size() == 0) {
			oldTrialActionCount = 0;
		} else {
			oldTrialActionCount = state.trialActionStack.getLast();
			if (shouldPop) {
				state.trialActionStack.removeLast();
			}
		}
		safeUndoActions(oldTrialActionCount);

		// needs to be a real checked exception if we ever decide to implement commits
		//assert (state.trialActionCount == 0 && oldTrialActionCount == 0) || oldTrialActionCount != state.trialActionCount : "Went back in time too far";
	}

	private void safeUndoActions(int total) {
		assert total >= 0 : "Tried to go back in time but the door was already shut."; //$NON-NLS-1$
		undoActions(total);
	}

	private void undoActions(int total) {
		while (state.trialActionCount > total) {
			Rule action = ((Rule) state.pendingCommits.removeLast());
			actionProvider.setActiveRule(action);
			actionProvider.undoAction(action.getRuleNumber());
			state.trialActionCount--;
		}
	}

	public void backtrack() {
		backtrackRequested = true;
	}

	public void commit() {
		while (state.pendingCommits.size() > 0) {
			Rule activeRule = (Rule) state.pendingCommits.removeFirst();
			actionProvider.setActiveRule(activeRule);
			actionProvider.finalAction(activeRule.getRuleNumber());
			state.totalCommits++;
		}
	}
}