com.barrybecker4.simulation.reactiondiffusion.algorithm.GrayScottController Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of bb4-reactiondiffusion Show documentation
bb4-simulation java code.
There is a newer version: 1.6.2
Show newest version
/** Copyright by Barry G. Becker, 2000-2011. Licensed under MIT License: http://www.opensource.org/licenses/MIT  */
package com.barrybecker4.simulation.reactiondiffusion.algorithm;

import com.barrybecker4.common.concurrency.Parallelizer;
import com.barrybecker4.simulation.reactiondiffusion.RDProfiler;

import java.awt.*;
import java.util.ArrayList;
import java.util.List;

/**
 * Runs the GrayScott algorithm concurrently when parallelization is enabled via setParallelized(true), which is the default.
 * Primary purpose of this class is to handle breaking the algorithm up into concurrent worker threads.
 *
 * Here are some parallelism results using my Core2Duo 6400 (and later i7 2600k) using fixed size.
 * Without parallelism  8.62 fps
 * With parallelism (but not borders) 10.16 fps
 * With parallelism (and borders in sep thread) 10.36 fps
 * After more tuning 18 fps (num steps per frame = 10)
 *
 * Using offscreen rendering slowed things by about 10%
 * These numbers are with Hyperthreading off. The difference compared to hyperthreading on is barely 10%.
 *
 *                       pr/ns  pr/sync  npr/ns  npr/synch
 *                      ------- -------  -------  -------
 * parallel calc       | 23.8     21.1    20.9    20.5
 * n-par calc          | 19.0     17.1            17.0
 * n-par calc/offscreen|                  12.8    12.9
 * par calc/offscreen  | 17.2     14.2    14.3    14.1
 *
 *   pr/ns : parallel rendering/ no synchronized
 *   npr/ns : no parallel rendering no synchronization.
 *   Parallel rendering without synchronization is fast, but has bad rendering artifacts.
 *
 * Made some more improvements
 *   - upgraded to a Core i7 2600k with 4 cores and 8 threads (hyper-threaded).
 *   - fixed a bug in Model.commit where I was using arrayCopy instead of just a pointer swap.
 *   - Modified parallel rendering code so that I compute images and write them quickly
 *     rather than drawing individual points which needed to be synchronized (set color, then draw point)
 * Notes
 *   - The difference between onscreen and offscreen rendering seems negligible.
 *   - Getting really great CPU utilization of cores - somewhere around 85%.
 *   - The temperature of the CPU really heats up. Saw max temp of 76C.
 *
 *                       par rend          non-par rendering
 *                      ------------       --------------
 * parallel calc       |   180 fps             78 fps
 * n-par calc          |   102 fps             66 fps
 *
 * For a rectangle larger than the fixed size, the performance increases seem even better.
 *
 *                       par rend          non-par rendering
 *                      ------------       --------------
 * parallel calc       |   19.5 fps            8.1 fps
 * n-par calc          |   13.2 fps            6.8 fps
 *
 *
 * @author Barry Becker
 */
public final class GrayScottController {

    /** Default value for the algorithm's h parameter; {@link #reset()} restores it. */
    public static final double H0 = 0.01;

    /** Manages the worker threads. Replaced by every call to {@link #setParallelized(boolean)}. */
    private Parallelizer parallelizer;

    private final GrayScottModel model_;

    private final GrayScottAlgorithm algorithm_;

    /**
     * Guards {@link #requestedNewSize}. A resize may be requested while a time step is in
     * progress, so the hand-off of the pending size must be atomic.
     */
    private final Object sizeLock = new Object();

    /** null if no new size has been requested. Only accessed while holding {@link #sizeLock}. */
    private Dimension requestedNewSize;


    /**
     * Constructor. Creates the model and the algorithm operating on it, and enables
     * parallel computation by default.
     * @param width width of computational space.
     * @param height height of computational space.
     */
    public GrayScottController(int width, int height) {
        model_ = new GrayScottModel(width, height);
        algorithm_ = new GrayScottAlgorithm(model_);
        setParallelized(true);
    }

    /** @return the model that this controller advances. */
    public GrayScottModel getModel() {
        return model_;
    }

    /**
     * Requests a new size for the computational space.
     * Doesn't change the size immediately since running threads may
     * be using the current array. We wait until the current timeStep completes
     * before reinitializing with the new size. If several requests arrive before the
     * end of a time step, only the most recent one is applied.
     * @param width requested width of computational space.
     * @param height requested height of computational space.
     */
    public void setSize(int width, int height) {
        Dimension size = new Dimension(width, height);
        synchronized (sizeLock) {
            requestedNewSize = size;
        }
    }

    /** Restores h to {@link #H0} and resets the state of the model. */
    public void reset() {
        algorithm_.setH(H0);
        model_.resetState();
    }

    /**
     * Forwards a new h value to the algorithm.
     * @param h new value of the algorithm's h parameter.
     */
    public void setH(double h) {
        algorithm_.setH(h);
    }

    /**
     * Set this to true if you want to run the version
     * that will partition the task of computing the next timeStep
     * into smaller pieces that can be run on different threads.
     * This should speed things up on a multi-core computer.
     * When false, a Parallelizer created with the argument 1 is used instead.
     *
     * NOTE(review): the previously installed Parallelizer is simply dropped here; if it owns
     * a thread pool it may need an explicit shutdown - confirm against Parallelizer.
     *
     * @param parallelized true to use the default-constructed Parallelizer.
     */
    public void setParallelized(boolean parallelized) {
        if (parallelized) {
            parallelizer = new Parallelizer();
        } else {
            parallelizer = new Parallelizer(1);
        }
    }

    /** @return true if the current parallelizer reports more than one thread. */
    public boolean isParallelized() {
        return parallelizer.getNumThreads() > 1;
    }

    /**
     * Advance one time step increment.
     * The interior columns are divided among worker runnables, the border values are computed
     * by one additional runnable, and once all of them have finished the changes are committed
     * to the model. A resize requested through {@link #setSize(int, int)} is applied last.
     *
     * @param dt time step in seconds.
     */
    public void timeStep(final double dt) {

        RDProfiler prof = RDProfiler.getInstance();

        // Worker creation is deliberately inside the timed section, as it always has been.
        prof.startConcurrentCalculationTime();
        List<Runnable> workers = createWorkers(dt);
        // blocks until all the runnables are done running.
        parallelizer.invokeAllRunnables(workers);
        prof.stopConcurrentCalculationTime();

        prof.startCommitChangesTime();
        model_.commitChanges();
        prof.stopCommitChangesTime();

        applyRequestedSize();
    }

    /**
     * Builds the runnables for one time step: one per column chunk plus one for the borders.
     * @param dt time step passed through to the algorithm.
     * @return the list of runnables to execute for this step.
     */
    private List<Runnable> createWorkers(final double dt) {
        int numThreads = parallelizer.getNumThreads();
        int width = model_.getWidth();
        int range = width / numThreads;

        // one slot per column chunk, plus one for the edge worker
        List<Runnable> workers = new ArrayList<Runnable>(numThreads + 1);

        // Chunks start at column 1; column 0 is left to the edge worker.
        // Bounds are presumably inclusive, since each chunk starts one past the previous max - confirm.
        for (int i = 0; i < (numThreads - 1); i++) {
            int offset = i * range;
            workers.add(new Worker(1 + offset, offset + range, dt));
        }

        // The last chunk also takes the columns left over by the integer division
        // and stops at width - 2, leaving the last column to the edge worker.
        int minXEdge = range * (numThreads - 1) + 1;
        int maxXEdge = width - 2;
        workers.add(new Worker(minXEdge, maxXEdge, dt));

        // also add the border calculations as a separate runnable.
        workers.add(new Runnable() {
            @Override
            public void run() {
                algorithm_.computeNewEdgeValues(dt);
            }
        });

        return workers;
    }

    /**
     * Applies a pending resize request, if there is one, and resets the simulation.
     * The pending request is taken and cleared in one atomic step so that a request
     * arriving concurrently is never lost; it is simply applied after the next time step.
     */
    private void applyRequestedSize() {
        Dimension newSize;
        synchronized (sizeLock) {
            newSize = requestedNewSize;
            requestedNewSize = null;
        }
        if (newSize != null) {
            model_.setSize(newSize);
            reset();
        }
    }

    /**
     * Runs one of the chunks: computes the next time step for the columns minX to maxX.
     */
    private class Worker implements Runnable {
        private final int minX_;
        private final int maxX_;
        private final double dt_;

        public Worker(int minX, int maxX, double dt) {
            minX_ = minX;
            maxX_ = maxX;
            dt_ = dt;
        }

        @Override
        public void run() {
            algorithm_.computeNextTimeStep(minX_, maxX_, dt_);
        }
    }
}