com.enioka.jqm.tools.QueuePoller Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of jqm-engine Show documentation
Show all versions of jqm-engine Show documentation
A library containing the JQM engine. Cannot be used alone.
/**
* Copyright © 2013 enioka. All rights reserved
* Authors: Marc-Antoine GOUILLART ([email protected])
* Pierre COPPEE ([email protected])
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.enioka.jqm.tools;
import java.lang.management.ManagementFactory;
import java.util.Calendar;
import java.util.Date;
import java.util.List;
import java.util.Map;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.Semaphore;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicInteger;
import javax.management.InstanceNotFoundException;
import javax.management.MBeanServer;
import javax.management.ObjectName;
import javax.persistence.EntityManager;
import javax.persistence.EntityNotFoundException;
import javax.persistence.LockModeType;
import javax.persistence.LockTimeoutException;
import org.apache.log4j.Logger;
import com.enioka.jqm.jpamodel.DeploymentParameter;
import com.enioka.jqm.jpamodel.JobInstance;
import com.enioka.jqm.jpamodel.Queue;
import com.enioka.jqm.jpamodel.State;
/**
* A thread that polls a queue according to the parameters defined inside a {@link DeploymentParameter}.
*/
class QueuePoller implements Runnable, QueuePollerMBean
{
private static Logger jqmlogger = Logger.getLogger(QueuePoller.class);
private Queue queue = null;
private JqmEngine engine;
private int maxNbThread = 10;
private int pollingInterval = 10000;
private boolean run = true;
private AtomicInteger actualNbThread = new AtomicInteger(0);
private boolean hasStopped = true;
private Calendar lastLoop = null;
private Map peremption = new ConcurrentHashMap();
private ObjectName name = null;
private Thread localThread = null;
private Semaphore loop;
@Override
public void stop()
{
jqmlogger.info("Poller has received a stop order");
run = false;
if (localThread != null)
{
localThread.interrupt();
}
}
/**
* Will make the thread ready to run once again after it has stopped.
*/
void reset()
{
if (!hasStopped)
{
throw new IllegalStateException("cannot reset a non stopped queue poller");
}
hasStopped = false;
run = true;
lastLoop = null;
loop = new Semaphore(0);
}
QueuePoller(JqmEngine engine, Queue q, int nbThreads, int interval)
{
jqmlogger.info("Engine " + engine.getNode().getName() + " will poll JobInstances on queue " + q.getName() + " every "
+ interval / 1000 + "s with " + nbThreads + " threads for concurrent instances");
EntityManager em = Helpers.getNewEm();
this.engine = engine;
this.queue = q;
this.pollingInterval = interval;
this.maxNbThread = nbThreads;
em.close();
reset();
registerMBean();
}
private void registerMBean()
{
try
{
if (this.engine.loadJmxBeans)
{
MBeanServer mbs = ManagementFactory.getPlatformMBeanServer();
name = new ObjectName(
"com.enioka.jqm:type=Node.Queue,Node=" + this.engine.getNode().getName() + ",name=" + this.queue.getName());
// Unregister MBean if it already exists. This may happen during frequent DP modifications.
try
{
mbs.getMBeanInfo(name);
mbs.unregisterMBean(name);
}
catch (InstanceNotFoundException e)
{
// Nothing to do, this should be the normal case.
}
mbs.registerMBean(this, name);
}
}
catch (Exception e)
{
throw new JqmInitError("Could not create JMX beans", e);
}
}
protected JobInstance dequeue(EntityManager em, int additionalSlots)
{
// Free room?
if (actualNbThread.get() >= maxNbThread)
{
return null;
}
// Get the list of all jobInstance within the defined queue, ordered by position
List availableJobs = em
.createQuery(
"SELECT j FROM JobInstance j LEFT JOIN FETCH j.jd WHERE j.queue = :q AND j.state = :s ORDER BY j.internalPosition ASC",
JobInstance.class)
.setParameter("q", queue).setParameter("s", State.SUBMITTED).setMaxResults(maxNbThread + additionalSlots).getResultList();
em.getTransaction().begin();
int rejectedCauseHighlander = 0;
for (JobInstance res : availableJobs)
{
// Lock is given when object is read, not during select... stupid.
// So we must check if the object is still SUBMITTED.
try
{
em.refresh(res, LockModeType.PESSIMISTIC_WRITE);
}
catch (EntityNotFoundException e)
{
// It has already been eaten and finished by another engine
// JPA2 dictates that in this case, the transaction is marked as rollback only.
// But beware, rollback detaches all entities from the session! So we simply give up and retry.
// As this is a very rare case, this is acceptable performance-wise.
em.getTransaction().rollback();
return dequeue(em, rejectedCauseHighlander);
}
catch (LockTimeoutException e)
{
// Just give up. We'll get another chance later.
em.getTransaction().rollback();
return null;
}
if (!res.getState().equals(State.SUBMITTED))
{
// Already eaten by another engine, not yet done
continue;
}
// Highlander?
if (res.getJd().isHighlander() && !highlanderPollingMode(res, em))
{
rejectedCauseHighlander++;
continue;
}
// Reserve the JI for this engine. Use a query rather than setter to avoid updating all fields (and locks when verifying FKs)
em.createQuery(
"UPDATE JobInstance j SET j.state = 'ATTRIBUTED', j.node = :n, j.attributionDate = current_timestamp() WHERE id=:i")
.setParameter("i", res.getId()).setParameter("n", this.engine.getNode()).executeUpdate();
// Stop at the first suitable JI. Release the lock & update the JI which has been attributed to us.
em.getTransaction().commit();
return res;
}
// If here, no suitable JI is available
em.getTransaction().rollback();
if (rejectedCauseHighlander > additionalSlots)
{
return dequeue(em, rejectedCauseHighlander);
}
return null;
}
/**
*
* @param jobToTest
* @param em
* @return true if job can be launched even if it is in highlander mode
*/
protected boolean highlanderPollingMode(JobInstance jobToTest, EntityManager em)
{
List jobs = em.createQuery(
"SELECT j FROM JobInstance j WHERE j IS NOT :refid AND j.jd = :jd AND (j.state = 'RUNNING' OR j.state = 'ATTRIBUTED')",
JobInstance.class).setParameter("refid", jobToTest).setParameter("jd", jobToTest.getJd()).getResultList();
return jobs.isEmpty();
}
@Override
public void run()
{
this.localThread = Thread.currentThread();
this.localThread.setName("QUEUE_POLLER;polling;" + this.queue.getName());
EntityManager em = null;
while (true)
{
lastLoop = Calendar.getInstance();
try
{
// Get a JI to run
em = Helpers.getNewEm();
JobInstance ji = dequeue(em, 0);
while (ji != null)
{
// We will run this JI!
jqmlogger.trace("JI number " + ji.getId() + " will be run by this poller this loop (already " + actualNbThread + "/"
+ maxNbThread + " on " + this.queue.getName() + ")");
actualNbThread.incrementAndGet();
if (ji.getJd().getMaxTimeRunning() != null)
{
this.peremption.put(ji.getId(), new Date((new Date()).getTime() + ji.getJd().getMaxTimeRunning() * 60 * 1000));
}
// Run it
if (!ji.getJd().isExternal())
{
(new Thread(new Loader(ji, this.engine, this, this.engine.getClassloaderManager()))).start();
}
else
{
(new Thread(new LoaderExternal(em, ji, this))).start();
}
// Check if there is another job to run (does nothing - no db query - if queue is full so this is not expensive)
ji = dequeue(em, 0);
}
}
catch (RuntimeException e)
{
if (Helpers.testDbFailure(e))
{
jqmlogger.error("connection to database lost - stopping poller");
jqmlogger.trace("connection error was:", e.getCause());
this.hasStopped = true;
this.engine.pollerRestartNeeded(this);
break;
}
else
{
jqmlogger.error("Queue poller has failed!", e);
throw e;
}
}
finally
{
// Reset the em on each loop.
Helpers.closeQuietly(em);
}
// Wait according to the deploymentParameter
try
{
loop.tryAcquire(this.pollingInterval, TimeUnit.MILLISECONDS);
}
catch (InterruptedException e)
{
run = false;
break;
}
// Exit if asked to
if (!run)
{
break;
}
}
if (!run)
{
// Run is true only if the loop has exited abnormally, in which case the engine should try to restart the poller
// So only do the graceful shutdown procedure if normal shutdown.
jqmlogger
.info("Poller loop on queue " + this.queue.getName() + " is stopping [engine " + this.engine.getNode().getName() + "]");
waitForAllThreads(60L * 1000);
jqmlogger.info("Poller on queue " + this.queue.getName() + " has ended normally");
// JMX
if (this.engine.loadJmxBeans)
{
try
{
ManagementFactory.getPlatformMBeanServer().unregisterMBean(name);
}
catch (Exception e)
{
jqmlogger.error("Could not unregister JMX beans", e);
}
}
// Let the engine decide if it should stop completely
this.hasStopped = true; // BEFORE check
this.engine.checkEngineEnd();
}
else
{
// else => Abnormal stop. Set booleans to reflect this.
this.run = false;
this.hasStopped = true;
}
}
@Override
public Integer getCurrentActiveThreadCount()
{
return actualNbThread.get();
}
/**
* Called when a payload thread has ended. This notifies the poller to free a slot and poll once again.
*/
void decreaseNbThread(int jobId)
{
this.peremption.remove(jobId);
this.actualNbThread.decrementAndGet();
loop.release(1);
this.engine.signalEndOfRun();
}
boolean isRunning()
{
return !this.hasStopped;
}
private void waitForAllThreads(long timeOutMs)
{
long timeWaitedMs = 0;
long stepMs = 1000;
while (timeWaitedMs <= timeOutMs)
{
jqmlogger.trace("Waiting the end of " + actualNbThread + " job(s)");
if (actualNbThread.get() == 0)
{
break;
}
if (timeWaitedMs == 0)
{
jqmlogger.info("Waiting for the end of " + actualNbThread + " jobs on queue " + this.queue.getName() + " - timeout is "
+ timeOutMs + "ms");
}
try
{
Thread.sleep(stepMs);
}
catch (InterruptedException e)
{
// Interruption => stop right now
jqmlogger.warn("Some job instances did not finish in time - wait was interrupted");
Thread.currentThread().interrupt();
return;
}
timeWaitedMs += stepMs;
}
if (timeWaitedMs > timeOutMs)
{
jqmlogger.warn("Some job instances did not finish in time - they will be killed for the poller to be able to stop");
}
}
Queue getQueue()
{
return this.queue;
}
JqmEngine getEngine()
{
return this.engine;
}
void setMaxThreads(int max)
{
if (this.maxNbThread > 0 && max == 0)
{
jqmlogger.info("Poller is being paused - it won't fetch any new job instances until it is resumed.");
}
else if (this.maxNbThread == 0 && max > 0)
{
jqmlogger.info("Poller is being resumed");
}
this.maxNbThread = max;
}
void setPollingInterval(int ms)
{
this.pollingInterval = ms;
}
// //////////////////////////////////////////////////////////
// JMX
// //////////////////////////////////////////////////////////
@Override
public long getCumulativeJobInstancesCount()
{
EntityManager em2 = Helpers.getNewEm();
Long nb = em2.createQuery("SELECT COUNT(i) From History i WHERE i.node = :n AND i.queue = :q", Long.class)
.setParameter("n", this.engine.getNode()).setParameter("q", this.queue).getSingleResult();
em2.close();
return nb;
}
@Override
public float getJobsFinishedPerSecondLastMinute()
{
EntityManager em2 = Helpers.getNewEm();
Calendar minusOneMinute = Calendar.getInstance();
minusOneMinute.add(Calendar.MINUTE, -1);
Float nb = em2.createQuery("SELECT COUNT(i) From History i WHERE i.endDate >= :d and i.node = :n AND i.queue = :q", Long.class)
.setParameter("d", minusOneMinute).setParameter("n", this.engine.getNode()).setParameter("q", this.queue).getSingleResult()
/ 60f;
em2.close();
return nb;
}
@Override
public long getCurrentlyRunningJobCount()
{
return this.actualNbThread.get();
}
@Override
public Integer getPollingIntervalMilliseconds()
{
return this.pollingInterval;
}
@Override
public Integer getMaxConcurrentJobInstanceCount()
{
return this.maxNbThread;
}
@Override
public boolean isActuallyPolling()
{
// 100ms is a rough estimate of the time taken to do the actual poll. If it's more, there is a huge issue elsewhere.
return (Calendar.getInstance().getTimeInMillis() - this.lastLoop.getTimeInMillis()) <= pollingInterval + 100;
}
@Override
public boolean isFull()
{
return this.actualNbThread.get() >= maxNbThread;
}
@Override
public int getLateJobs()
{
int i = 0;
Date now = new Date();
for (Date d : this.peremption.values())
{
if (now.after(d))
{
i++;
}
}
return i;
}
}