/** * Copyright © 2013 enioka. All rights reserved * Authors: Marc-Antoine GOUILLART (marc-antoine.gouillart@enioka.com) * Pierre COPPEE (pierre.coppee@enioka.com) * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.enioka.jqm.tools; import java.io.File; import java.lang.management.ManagementFactory; import java.net.MalformedURLException; import java.util.Calendar; import java.util.GregorianCalendar; import java.util.HashMap; import java.util.Locale; import java.util.Map; import java.util.Properties; import javax.management.MBeanServer; import javax.management.ObjectName; import org.apache.commons.io.FileUtils; import org.apache.commons.io.FilenameUtils; import org.apache.commons.lang.StringUtils; import org.apache.log4j.Logger; import com.enioka.jqm.api.JqmClientFactory; import com.enioka.jqm.jdbc.DbConn; import com.enioka.jqm.jdbc.QueryResult; import com.enioka.jqm.model.History; import com.enioka.jqm.model.JobInstance; import com.enioka.jqm.model.Node; import com.enioka.jqm.model.RuntimeParameter; import com.enioka.jqm.model.State; /** * The loader is the tracker object for a payload execution. The job thread starts here and ends here. This class handles logging (creation * of {@link History}),starting the payload, etc. */ class Loader implements Runnable, LoaderMBean { private Logger jqmlogger = Logger.getLogger(Loader.class); private JobInstance job = null; private Node node = null; private final QueuePoller p; private final JqmEngine engine; private final ClassloaderManager clm; private ObjectName name = null; private ClassLoader classLoaderToRestoreAtEnd = null; Boolean isDone = false, isDelayed = false; private String threadName; // These two fields are instance-level in order to allow an easy endOfRunDb external call private Calendar endDate = null; private State resultStatus = State.ATTRIBUTED; Loader(JobInstance job, JqmEngine engine, QueuePoller p, ClassloaderManager clm) { this.p = p; this.engine = engine; this.clm = clm; this.job = job; this.threadName = this.job.getJD().getApplicationName() + ";payload;" + this.job.getId(); // JMX if (p != null && this.p.getEngine().loadJmxBeans) { MBeanServer mbs = ManagementFactory.getPlatformMBeanServer(); try { name = new ObjectName("com.enioka.jqm:type=Node.Queue.JobInstance,Node=" + this.p.getEngine().getNode().getName() + ",Queue=" + this.p.getQueue().getName() + ",name=" + this.job.getId()); mbs.registerMBean(this, name); } catch (Exception e) { throw new JqmInitError("Could not create JMX bean for running job instance", e); } } } @Override public void run() { try { runPayload(); } catch (Throwable t) { jqmlogger.error("An unexpected error has occurred - the engine may have become unstable", t); } } private void runPayload() { // Set thread name Thread.currentThread().setName(threadName); // One log per launch? if (System.out instanceof MultiplexPrintStream) { String fileName = StringUtils.leftPad("" + this.job.getId(), 10, "0"); MultiplexPrintStream mps = (MultiplexPrintStream) System.out; mps.registerThread(String.valueOf(fileName + ".stdout.log")); mps = (MultiplexPrintStream) System.err; mps.registerThread(String.valueOf(fileName + ".stderr.log")); } // Log this.resultStatus = State.SUBMITTED; jqmlogger.debug("A loader/runner thread has just started for Job Instance " + job.getId() + ". Jar is: " + job.getJD().getJarPath() + " - class is: " + job.getJD().getJavaClassName()); final Map<String, String> params; final JarClassLoader jobClassLoader; final JobManagerHandler handler; this.node = this.job.getNode(); // Block needing the database DbConn cnx = null; try { cnx = Helpers.getNewDbSession(); // Disabled if (!this.job.getJD().isEnabled()) { jqmlogger.info("Job Instance " + job.getId() + " will actually not truly run as its Job Definition is disabled"); job.setProgress(-1); // Not persisted, but useful to endOfRunDb resultStatus = State.ENDED; endOfRun(); return; } // Parameters params = new HashMap<String, String>(); for (Map.Entry<String, String> jp : RuntimeParameter.select_map(cnx, "jiprm_select_by_ji", job.getId()).entrySet()) { jqmlogger.trace("Parameter " + jp.getKey() + " - " + jp.getValue()); params.put(jp.getKey(), jp.getValue()); } // Cache heating this.job.getJD().getClassLoader(cnx); jobClassLoader = this.clm.getClassloader(job, cnx); handler = new JobManagerHandler(job, params); // Update of the job status, dates & co this.job.setExecutionDate(Calendar.getInstance()); // For use in JMX QueryResult qr = cnx.runUpdate("jj_update_run_by_id", job.getId()); if (qr.nbUpdated == 0) { // This means the JI has been killed or has disappeared. jqmlogger.warn("Trying to run a job which disappeared or is not in ATTRIBUTED state (likely killed) " + job.getId()); if (p != null) { p.decreaseNbThread(job.getId()); } return; } cnx.commit(); } catch (JqmPayloadException e) { jqmlogger.warn("Could not resolve CLASSPATH for job " + job.getJD().getApplicationName(), e); resultStatus = State.CRASHED; endOfRun(); return; } catch (MalformedURLException e) { jqmlogger.warn("The JAR file path specified in Job Definition is incorrect " + job.getJD().getApplicationName(), e); resultStatus = State.CRASHED; endOfRun(); return; } catch (RuntimeException e) { firstBlockDbFailureAnalysis(e); return; } finally { Helpers.closeQuietly(cnx); } // Class loader switch classLoaderToRestoreAtEnd = Thread.currentThread().getContextClassLoader(); try { // Switch jqmlogger.trace("Setting class loader"); Thread.currentThread().setContextClassLoader(jobClassLoader); jqmlogger.trace("Class Loader was set correctly"); } catch (Exception e) { jqmlogger.error("Could not switch classloaders", e); this.resultStatus = State.CRASHED; endOfRun(); return; } // Go! (launches the main function in the startup class designated in the manifest) try { jobClassLoader.launchJar(job, params, clm, handler); this.resultStatus = State.ENDED; } catch (JqmKillException e) { jqmlogger.info("Job instance " + job.getId() + " has been killed."); this.resultStatus = State.KILLED; } catch (Exception e) { jqmlogger.info("Job instance " + job.getId() + " has crashed. Exception was:", e); this.resultStatus = State.CRASHED; } // Job instance has now ended its run try { endOfRun(); } catch (Exception e) { jqmlogger.error("An error occurred while finalizing the job instance.", e); } jqmlogger.debug("End of loader for JobInstance " + this.job.getId() + ". Thread will now end"); } /** * For external payloads. This is used to force the end of run. */ void endOfRun(State s) { this.resultStatus = s; endOfRun(); } private void endOfRun() { // Register end date as soon as possible to be as exact as possible (sending mails may take time for example) endDate = GregorianCalendar.getInstance(Locale.getDefault()); // This block is needed for external payloads, as the single runner may forcefully call endOfRun. synchronized (this) { if (!isDone) { isDone = true; } else { return; } } // Release the slot so as to allow other job instances to run (first op!) if (p != null) { p.decreaseNbThread(this.job.getId()); } // Send e-mail before releasing the slot - it may be long if (job.getEmail() != null) { try { Helpers.sendEndMessage(job); } catch (Exception e) { jqmlogger.warn("An e-mail could not be sent. No impact on the engine.", e); } } // Clean class loader ClassLoaderLeakCleaner.clean(Thread.currentThread().getContextClassLoader()); // Clean JDBC connections ClassLoaderLeakCleaner.cleanJdbc(Thread.currentThread()); // Restore class loader if (this.classLoaderToRestoreAtEnd != null) { Thread.currentThread().setContextClassLoader(classLoaderToRestoreAtEnd); jqmlogger.trace("Class Loader was correctly restored"); } // Clean temp dir (if it exists) File tmpDir = new File(FilenameUtils.concat(node.getTmpDirectory(), "" + job.getId())); if (tmpDir.isDirectory()) { try { if (FileUtils.deleteQuietly(tmpDir)) { jqmlogger.trace("temp directory was removed"); } else { jqmlogger.warn("Could not remove temp directory " + tmpDir.getAbsolutePath() + "for this job instance. There may be open handlers remaining open."); } } catch (Exception e) { jqmlogger.warn("Could not remove temp directory for unusual reasons", e); } } // Unregister MBean if (p != null && this.p.getEngine().loadJmxBeans) { try { MBeanServer mbs = ManagementFactory.getPlatformMBeanServer(); mbs.unregisterMBean(name); } catch (Exception e) { jqmlogger.error("Could not unregister JobInstance JMX bean", e); } } // Unregister logger unregisterLogger(); // Part needing DB connection with specific failure handling code. endOfRunDb(); } private void unregisterLogger() { if (System.out instanceof MultiplexPrintStream) { MultiplexPrintStream mps = (MultiplexPrintStream) System.out; mps.unregisterThread(); mps = (MultiplexPrintStream) System.err; mps.unregisterThread(); } } /** * Part of the endOfRun process that needs the database. May be deferred if the database is not available. */ void endOfRunDb() { DbConn cnx = null; try { cnx = Helpers.getNewDbSession(); // Done: put inside history & remove instance from queue. History.create(cnx, job, this.resultStatus, endDate); jqmlogger.trace("An History was just created for job instance " + this.job.getId()); cnx.runUpdate("ji_delete_by_id", this.job.getId()); cnx.commit(); } catch (RuntimeException e) { endBlockDbFailureAnalysis(e); } finally { Helpers.closeQuietly(cnx); } } private void firstBlockDbFailureAnalysis(Exception e) { if (Helpers.testDbFailure(e)) { jqmlogger.error("connection to database lost - loader " + this.getId() + " will be restarted later"); jqmlogger.trace("connection error was:", e); this.engine.loaderRestartNeeded(this); unregisterLogger(); return; } else { jqmlogger.error("a database related operation has failed and cannot be recovered", e); resultStatus = State.CRASHED; endOfRun(); return; } } private void endBlockDbFailureAnalysis(RuntimeException e) { if (Helpers.testDbFailure(e)) { jqmlogger.error("connection to database lost - loader " + this.getId() + " will need delayed finalization"); jqmlogger.trace("connection error was:", e.getCause()); this.engine.loaderFinalizationNeeded(this); this.isDelayed = true; } else { jqmlogger.error("a database related operation has failed and cannot be recovered", e); throw e; } } // //////////////////////////////////////////////////////////// // JMX methods // //////////////////////////////////////////////////////////// @Override public void kill() { Properties props = new Properties(); props.put("com.enioka.jqm.jdbc.contextobject", Helpers.getDb()); JqmClientFactory.getClient("uncached", props, false).killJob(this.job.getId()); } @Override public String getApplicationName() { return this.job.getJD().getApplicationName(); } @Override public Calendar getEnqueueDate() { return this.job.getCreationDate(); } @Override public String getKeyword1() { return this.job.getKeyword1(); } @Override public String getKeyword2() { return this.job.getKeyword2(); } @Override public String getKeyword3() { return this.job.getKeyword3(); } @Override public String getModule() { return this.job.getModule(); } @Override public String getUser() { return this.job.getUserName(); } @Override public String getSessionId() { return this.job.getSessionID(); } @Override public Integer getId() { return this.job.getId(); } @Override public Long getRunTimeSeconds() { if (this.job.getExecutionDate() == null) { DbConn cnx = Helpers.getNewDbSession(); this.job.setExecutionDate(cnx.runSelectSingle("ji_select_execution_date_by_id", Calendar.class, this.job.getId())); cnx.close(); } if (this.job.getExecutionDate() == null) { return 0L; } return (Calendar.getInstance().getTimeInMillis() - this.job.getExecutionDate().getTimeInMillis()) / 1000; } }