All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.duracloud.mill.ltp.LoopingTaskProducer Maven / Gradle / Ivy

The newest version!
/*
 * The contents of this file are subject to the license and copyright
 * detailed in the LICENSE and NOTICE files at the root of the source
 * tree and available online at
 *
 *     http://duracloud.org/license/
 */
package org.duracloud.mill.ltp;

import java.io.File;
import java.io.IOException;
import java.net.InetAddress;
import java.net.UnknownHostException;
import java.text.MessageFormat;
import java.time.LocalTime;
import java.util.Calendar;
import java.util.Date;
import java.util.HashMap;
import java.util.LinkedHashSet;
import java.util.LinkedList;
import java.util.List;
import java.util.Map;
import java.util.Queue;
import java.util.Set;
import java.util.Timer;
import java.util.TimerTask;

import org.duracloud.common.queue.TaskQueue;
import org.duracloud.mill.common.storageprovider.StorageProviderFactory;
import org.duracloud.mill.credentials.AccountCredentialsNotFoundException;
import org.duracloud.mill.credentials.CredentialsRepo;
import org.duracloud.mill.credentials.CredentialsRepoException;
import org.duracloud.mill.credentials.StorageProviderCredentials;
import org.duracloud.mill.notification.NotificationManager;
import org.duracloud.storage.provider.StorageProvider;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

/**
 * This class is responsible for filling the duplication TaskQueue
 * by looping through all duplication policies for all accounts and spaces and
 * blindly creates duplication tasks. It will create tasks for all items in the
 * the source destination as well as all items in the destination provider but
 * not in the source provider. A notable feature of this task producer is that
 * it attempts to respect a designated maximum task queue size. Once the limit
 * has been reached, the producer will stop. On subsequent runs, the producer
 * will pick up where it left off, starting with the next account,space,set of
 * content items, and duplication store policy. If all content items are visited
 * within a single run before the task queue limit has been reached, the
 * producer will exit.
 *
 * For more information about how this process fits into the whole system of
 * collaborating components, see
 * https://wiki.duraspace.org/display/DSPINT/DuraCloud+Duplication+-+System+Overview
 *
 * @author Daniel Bernstein
 * Date: Nov 5, 2013
 */
public abstract class LoopingTaskProducer implements Runnable {
    private static Logger log = LoggerFactory.getLogger(LoopingTaskProducer.class);
    private TaskQueue taskQueue;
    private CredentialsRepo credentialsRepo;
    private StateManager stateManager;
    private int maxTaskQueueSize;
    private StorageProviderFactory storageProviderFactory;
    private List morselsToReload = new LinkedList<>();
    private Frequency frequency;
    private LocalTime startTime;
    private RunStats cumulativeTotals;
    private NotificationManager notificationManager;
    private LoopingTaskProducerConfigurationManager config;
    private Map runstats = new HashMap<>();

    public LoopingTaskProducer(CredentialsRepo credentialsRepo,
                               StorageProviderFactory storageProviderFactory,
                               TaskQueue taskQueue,
                               StateManager state,
                               int maxTaskQueueSize,
                               Frequency frequency,
                               LocalTime startTime,
                               NotificationManager notificationManager,
                               LoopingTaskProducerConfigurationManager config) {

        this.credentialsRepo = credentialsRepo;
        this.storageProviderFactory = storageProviderFactory;
        this.taskQueue = taskQueue;
        this.stateManager = state;
        this.credentialsRepo = credentialsRepo;
        this.maxTaskQueueSize = maxTaskQueueSize;
        this.frequency = frequency;
        this.startTime = startTime;
        this.cumulativeTotals = createRunStats();
        this.notificationManager = notificationManager;
        this.config = config;
    }

    protected Frequency getFrequency() {
        return this.frequency;
    }

    protected CredentialsRepo getCredentialsRepo() {
        return credentialsRepo;
    }

    protected TaskQueue getTaskQueue() {
        return taskQueue;
    }

    protected int getMaxTaskQueueSize() {
        return maxTaskQueueSize;
    }

    public void run() {

        Timer timer = new Timer();
        try {

            timer.scheduleAtFixedRate(new TimerTask() {
                @Override
                public void run() {
                    logSessionStats();
                }

            }, 5 * 60 * 1000, 5 * 60 * 1000);

            if (runLater()) {
                return;
            }

            log.info("Starting run...");
            Queue morselQueue = loadMorselQueue();

            while (!morselQueue.isEmpty() && this.taskQueue.size() < maxTaskQueueSize) {
                T morsel = morselQueue.peek();

                if (morsel != null) {
                    //check that account is still active
                    //if not remove from list, but only if
                    //it has not yet been started.  If an account becomes
                    //inactive in the middle of processing a morsel,  then
                    //allow to finish even if it results in errors.
                    String account = morsel.getAccount();
                    try {
                        if (!this.credentialsRepo.isAccountActive(account)) {
                            if (morsel.getMarker() == null) {
                                log.info("account {} has become inactive.  Abandonning morsel {}.", account, morsel);
                                morselQueue.poll();
                                continue;
                            } else {
                                String message = MessageFormat
                                    .format("account {0} has become inactive in the middle of processing {1}. "
                                            + "  Allowing this morsel to continue but failure is likely.  "
                                            + "\nExpect items to appear in the dead letter queue shortly.",
                                            account, morsel);
                                log.warn(message);
                                sendEmail(getSimpleName() +
                                          " attempting into account after start of morsel processing.",
                                          message);
                            }
                        }
                    } catch (AccountCredentialsNotFoundException ex) {
                        String message =
                            MessageFormat.format("account {0} does not exist.  Abandonning morsel {1}.",
                                                 account, morsel);
                        log.warn(message);
                        sendEmail(getSimpleName() + " attempted to access into non-existent account", message);

                    }
                }
                nibble(morselQueue);
                persistMorsels(morselQueue, morselsToReload);

                if (morselQueue.isEmpty()) {
                    morselQueue = reloadMorselQueue();
                } else {
                    //break if nothing was removed from the queue
                    //if nothing was removed from the queue we can assume
                    //that the for whatever reason the morsel could not be processed
                    //at this time, so the process should wait for the next run.
                    if (morsel.equals(morselQueue.peek())) {
                        break;
                    }
                }

            }

            logSessionStats();

            if (morselQueue.isEmpty()) {
                scheduleNextRun();
                writeCompletionFile();
            }

            log.info("Session ended.");
        } catch (Exception ex) {
            log.error("failed to complete run on " + getSimpleName() + ": " + ex.getMessage(), ex);
            sendEmail( "failed to complete run on " + getSimpleName(),
                       ex.getClass().getCanonicalName() + ":" + ex.getMessage() );
        } finally {
            timer.cancel();
        }
    }

    private String getSimpleName() {
        return getClass().getSimpleName();
    }

    /**
     * Writes zero length file to the work directory to mark the completion of a run.
     */
    private void writeCompletionFile() {
        File completionFile = getCompletionFile();
        try {
            if (completionFile.createNewFile()) {
                log.info("successfully created completion marker file: {}",
                         completionFile.getAbsolutePath());
            } else {
                log.warn("completion marker file unexpectably exists already " +
                         "- something may be amiss: {}",
                         completionFile.getAbsolutePath());

            }
        } catch (IOException e) {
            log.error("Unable to create the completion file {}: {}",
                      completionFile.getAbsolutePath(),
                      e.getMessage());
        }
    }

    /**
     * Deletes the completion marker file if it exists.
     */
    private void deleteCompletionFileIfExists() {
        File completionFile = getCompletionFile();
        if (completionFile.exists()) {
            completionFile.delete();
        }
    }

    /**
     * @return
     */
    private File getCompletionFile() {
        return new File(this.config.getWorkDirectoryPath(),
                        getLoopingProducerTypePrefix() + "-producer-complete.txt");
    }

    private void resetIncrementalSessionStats() {
        synchronized (runstats) {
            for (String account : runstats.keySet()) {
                RunStats stats = runstats.get(account);
                stats.reset();
            }
        }
    }

    protected RunStats calculateStatTotals(RunStats currentTotals) {
        RunStats totals = createRunStats();
        totals.copyValuesFrom(currentTotals);

        synchronized (runstats) {
            for (String account : runstats.keySet()) {
                RunStats stats = runstats.get(account);
                totals.add(stats);
            }
            return totals;
        }
    }

    private void logSessionStats() {
        synchronized (runstats) {
            for (String account : runstats.keySet()) {
                RunStats stats = runstats.get(account);
                logIncrementalStatsByAccount(account, stats);
            }

            RunStats incrementalTotals = calculateStatTotals(createRunStats());
            logGlobalncrementalStats(incrementalTotals);

            this.cumulativeTotals = calculateStatTotals(cumulativeTotals);
            logCumulativeSessionStats(runstats, this.cumulativeTotals);
            resetIncrementalSessionStats();
        }
    }

    /**
     *
     */
    private void scheduleNextRun() {
        Date currentStartDate = this.stateManager.getCurrentRunStartDate();
        Date nextRun = calculateNextRunDate(currentStartDate);
        this.stateManager.setNextRunStartDate(nextRun);
        this.stateManager.setCurrentRunStartDate(null);

        String hostname = "unknown";
        try {
            hostname = InetAddress.getLocalHost().getHostName();
        } catch (UnknownHostException e) {
            log.error("unable to get hostname:" + e.getMessage());
        }

        String subject = getClass().getSimpleName() + "'s run completed on " + hostname;
        StringBuilder builder = new StringBuilder();
        builder.append(subject + "\n");
        builder.append(this.cumulativeTotals.toString() + "\n");

        if (nextRun != null) {
            builder.append("Scheduling the next run for " + nextRun + "\n");
            log.info(subject + ": next run will start " + nextRun);
        }

        sendEmail(subject, builder.toString());
    }

    private Date calculateNextRunDate(Date previousDate) {
        Date nextRun;
        Calendar c = Calendar.getInstance();
        //if the current start date is null calculate based on present moment.
        if (previousDate == null) {
            //if a start time is defined
            if (this.startTime != null) {
                //calculate based on start time.
                c.set(Calendar.HOUR_OF_DAY, this.startTime.getHour());
                c.set(Calendar.MINUTE, this.startTime.getMinute());
                c.set(Calendar.SECOND, this.startTime.getSecond());

                //if the start time is before the present moment
                LocalTime now = LocalTime.now();
                if (this.startTime.isBefore(now)) {
                    // if less than 10 minutes has passed since the start time,
                    // allow the next run to occur now (don't push to tomorrow)
                    LocalTime startTimePlusTen = LocalTime.of(startTime.getHour(),
                                                              startTime.getMinute() + 10,
                                                              startTime.getSecond());
                    if (startTimePlusTen.isAfter(now)) {
                        log.info("Less than 10 minutes has passed since the scheduled start time, " +
                                 "allowing run to begin now.");
                    } else {
                        //move to the following day
                        log.info("The start time has passed for today. " +
                                 "Setting next run to occur tomorrow");
                        c.add(Calendar.DATE, 1);
                    }
                }
                nextRun = c.getTime();
            } else {
                //next run is now
                nextRun = new Date();
            }

        } else {  //otherwise calculate based on previous  date
            //add the frequency
            c.setTimeInMillis(previousDate.getTime());
            c.add(this.frequency.getTimeUnit(), this.frequency.getValue());
            nextRun = c.getTime();
        }

        //return null if the frequency is zero or less.
        if (this.frequency.getValue() <= 0) {
            nextRun = null;
        }

        return nextRun;
    }

    protected void sendEmail(String subject, String body) {
        this.notificationManager.sendEmail(subject, body);
    }

    /**
     * @return true if the process should wait until later
     */
    private boolean runLater() {
        boolean runLater = true;
        Date nextRun = this.stateManager.getNextRunStartDate();

        if (nextRun != null) {
            Date now = new Date();
            if (getFrequency().getValue() <= 0) {
                log.info("The frequency is set to {}: all scheduled runs will be cancelled.",
                         getFrequency());
                this.stateManager.setNextRunStartDate(null);
            } else if (now.after(nextRun)) {
                deleteCompletionFileIfExists();
                this.stateManager.setCurrentRunStartDate(now);
                this.stateManager.setNextRunStartDate(null);
                runLater = false;
                log.info("Time to start a new run: the next run was scheduled to run on {}. Let's roll.", nextRun);
            } else {
                log.info("It's not yet time start a new run: the next run is scheduled to run on {}.", nextRun);
            }
        } else {
            Date currentRunStartDate = this.stateManager.getCurrentRunStartDate();
            if (currentRunStartDate == null && getFrequency().getValue() <= 0) {
                log.info("The frequency is set to {}: no future runs will be scheduled.", getFrequency());
            } else {
                if (currentRunStartDate == null) {
                    Date startDate = calculateNextRunDate(null);

                    if (startDate.getTime() <= System.currentTimeMillis()) {
                        this.stateManager.setCurrentRunStartDate(startDate);
                        log.info("We're starting the first run on this machine");
                    } else {
                        this.stateManager.setNextRunStartDate(startDate);
                        log.info("We will start the first run on this machine at {}", startDate);
                        return true;
                    }
                } else {
                    log.info("We're continuing the current run which was started on {}", currentRunStartDate);
                }
                runLater = false;
            }
        }

        return runLater;
    }

    /**
     * @return
     */
    private MorselQueue reloadMorselQueue() {
        List morsels = morselsToReload;
        morselsToReload = new LinkedList<>();
        MorselQueue queue = new MorselQueue<>();
        queue.addAll(morsels);
        return queue;
    }

    /**
     * Loads the morsels from the persistent state if there are any; otherwise it loads  all other morsels based on
     * on duplication policy manager.
     *
     * @return
     */
    private Queue loadMorselQueue() {
        Queue morselQueue = createQueue();

        //load morsels from state;
        Set morsels = new LinkedHashSet<>(this.stateManager.getMorsels());

        morselQueue.addAll(morsels);

        if (morselQueue.isEmpty()) {
            loadMorselQueueFromSource(morselQueue);
        }

        return morselQueue;
    }

    /**
     * @return
     */
    protected Queue createQueue() {
        return new LinkedList();
    }

    private void persistMorsels(Queue queue, List morselsToReload) {
        LinkedHashSet morsels = new LinkedHashSet<>();
        morsels.addAll(queue);
        morsels.addAll(morselsToReload);
        stateManager.setMorsels(morsels);
    }

    /**
     * @param morsel
     */
    protected void addToReloadList(T morsel) {
        log.info("adding morsel to reload list: {}", morsel);
        morselsToReload.add(morsel);
    }

    /**
     * @param account
     * @return
     */
    protected RunStats getStats(String account) {
        synchronized (runstats) {
            RunStats stats = this.runstats.get(account);
            if (stats == null) {
                this.runstats.put(account, stats = createRunStats());
            }
            return stats;
        }
    }

    protected StorageProvider getStorageProvider(String account,
                                                 String storeId) {
        StorageProviderCredentials creds;
        try {
            creds = credentialsRepo.getStorageProviderCredentials(account, storeId);
        } catch (CredentialsRepoException e) {
            throw new RuntimeException(e);
        }

        return getStorageProvider(creds);
    }

    /**
     * @param creds
     * @return
     */
    protected StorageProvider getStorageProvider(StorageProviderCredentials creds) {
        return storageProviderFactory.create(creds);
    }

    /**
     * @param morselQueue
     */
    protected abstract void loadMorselQueueFromSource(Queue morselQueue);

    /**
     * @param queue
     */
    protected abstract void nibble(Queue queue);

    /**
     * @return
     */
    protected abstract RunStats createRunStats();

    /**
     * @param incrementalTotals
     */
    protected abstract void logGlobalncrementalStats(RunStats incrementalTotals);

    /**
     * @param account
     * @param stats
     */
    protected abstract void logIncrementalStatsByAccount(String account, RunStats stats);

    /**
     * @param runstats
     * @param cumulativeTotals
     */
    protected abstract void logCumulativeSessionStats(Map runstats, RunStats cumulativeTotals);

    /**
     * A short looping producer type identifier for use with state files.
     *
     * @return
     */
    protected abstract String getLoopingProducerTypePrefix();

    /**
     * @param message
     * @param ex
     */
    protected void sendEmail(String message, Exception ex) {
        StackTraceElement[] stackTrace = ex.getStackTrace();
        StringBuilder builder = new StringBuilder();
        for (StackTraceElement ste : stackTrace) {
            builder.append(ste.toString() + "\n");
        }
        sendEmail(message, builder.toString());
    }

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy