ParallelExecutor.java example

Explorer
jop-master
/*
  This file is part of JOP, the Java Optimized Processor
    see <http://www.jopdesign.com/>

  Copyright (C) 2009, Martin Schoeberl (martin@jopdesign.com)

  This program is free software: you can redistribute it and/or modify
  it under the terms of the GNU General Public License as published by
  the Free Software Foundation, either version 3 of the License, or
  (at your option) any later version.

  This program is distributed in the hope that it will be useful,
  but WITHOUT ANY WARRANTY; without even the implied warranty of
  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  GNU General Public License for more details.

  You should have received a copy of the GNU General Public License
  along with this program.  If not, see <http://www.gnu.org/licenses/>.
*/


/**
 *
 */
package cmp;

import com.jopdesign.io.IOFactory;
import com.jopdesign.io.SysDevice;
import com.jopdesign.sys.Startup;

/**
 * A minimal framework for work distribution to the CMP cores.
 *
 * @author Martin Schoeberl (martin@jopdesign.com)
 *
 */
public class ParallelExecutor {

	private class Runner implements Runnable {

		volatile boolean finished;
		Execute ex;

		public Runner() {
			finished = true;
		}

		void setExecute(Execute e) {
			ex = e;
		}

		public void run() {
			for (;;) {
				if (cnt<size && !finished) {
					int i;
					synchronized(ex) {
						i = cnt++;
					}
					if (i<size) {
						ex.execute(i);
					}
				} else {
					finished = true;
				}
			}
		}

	}

	private volatile int cnt;
	private volatile int size;
	private Runner runner[];
	SysDevice sys = IOFactory.getFactory().getSysDevice();

	public ParallelExecutor() {

		runner = new Runner[sys.nrCpu-1];
		for (int i=0; i<sys.nrCpu-1; i++) {
			runner[i] = new Runner();
			Startup.setRunnable(runner[i], i);
		}
		// we already start all cores here
		sys.signal = 1;
	}

	public void executeParallel(Execute e, int size) {

		this.size = size;
		cnt = 0;

		// distribute the work to all cores.
		                                    //rup: setting 12 cores as max to avoid changing all the time
		for (int i=0; i<sys.nrCpu-1; ++i) { //@WCA loop=12
			runner[i].setExecute(e);
			runner[i].finished = false;
		}
		// do also some work
		                   //number of data points
		while (cnt<size) { //@WCA loop=14
			int i;
			synchronized(e) {
				i = cnt++;
			}
			if (i<size) {
				e.execute(i);
			}
		}
		// now wait for others finishing their work
		boolean allFinished;

		do {
			allFinished = true;                 //rup: setting 12 cores as max to avoid changing all the time
			for (int i=0; i<sys.nrCpu-1; ++i) { //@WCA loop=12
				allFinished &= runner[i].finished;
			}                   // rup: this is tricky, how to model it martin?
		} while (!allFinished); //@WCA loop=100
		// now we can return


		// that would be a serial version for tests:
//		for (int i=0; i<size; ++i) {
//			e.execute(i);
//		}
	}
	/**
	 * @param args
	 */
	public static void main(String[] args) {

		Execute e = new Test();
		ParallelExecutor pe = new ParallelExecutor();
		pe.executeParallel(e, Test.N);
		Test.result();
	}

	private static class Test implements Execute {

		final static int N = 100;
		static int a[] = new int[N];

		public void execute(int nr) {
			a[nr] = IOFactory.getFactory().getSysDevice().cpuId+1;
		}

		public static void result() {
			for (int i=0; i<N; ++i) {
				System.out.println(a[i]);
			}
		}
	}


}