All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.fasterxml.sort.IteratingSorter Maven / Gradle / Ivy

package com.fasterxml.sort;

import com.fasterxml.sort.util.CastingIterator;
import com.fasterxml.sort.util.SegmentedBuffer;

import java.io.Closeable;
import java.io.File;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Comparator;
import java.util.Iterator;
import java.util.List;
import java.util.NoSuchElementException;

public class IteratingSorter extends SorterBase implements Closeable
{
    // Set iff sort spilled to disk
    private List _mergerInputs;
    private DataReader _merger;


    public IteratingSorter(SortConfig config,
                           DataReaderFactory readerFactory,
                           DataWriterFactory writerFactory,
                           Comparator comparator)
    {
        super(config, readerFactory, writerFactory, comparator);
    }

    public IteratingSorter() {
        super();
    }

    public IteratingSorter(SortConfig config) {
        super(config);
    }

    /**
     * Method that will perform full sort on input data read using given
     * {@link DataReader}.
     *
     * Conversions to and from intermediate sort files is done
     * using {@link DataReaderFactory} and {@link DataWriterFactory} configured
     * for this sorter.
     *
     * The returned Iterator will throw {@link IterableSorterException} if any
     * IOException is encountered during calls of {@link Iterator#next()}.
     *
     * @return Iterator if sorting complete and output is ready to be written; null if it was cancelled
     */
    public Iterator sort(DataReader inputReader)
        throws IOException
    {
        // Clean up any previous sort
        close();

        // First, pre-sort:
        _phase = Phase.PRE_SORTING;
        boolean inputClosed = false;

        SegmentedBuffer buffer = new SegmentedBuffer();
        _presortFileCount = 0;
        _sortRoundCount = -1;
        _currentSortRound = -1;

        Iterator iterator = null;
        try {
            Object[] items = _readMax(inputReader, buffer, _config.getMaxMemoryUsage(), null);
            if (_checkForCancel()) {
                close();
                return null;
            }
            Arrays.sort(items, _rawComparator());
            T next = inputReader.readNext();
            /* Minor optimization: in case all entries might fit in
             * in-memory sort buffer, avoid writing intermediate file
             * and just write results directly.
             */
            if (next == null) {
                inputClosed = true;
                inputReader.close();
                _phase = Phase.SORTING;
                iterator = new CastingIterator(Arrays.asList(items).iterator());
            } else { // but if more data than memory-buffer-full, do it right:
                List presorted = new ArrayList();
                presorted.add(_writePresorted(items));
                items = null; // it's a big array, clear refs as early as possible
                _presort(inputReader, buffer, next, presorted);
                inputClosed = true;
                inputReader.close();
                _phase = Phase.SORTING;
                if (_checkForCancel(presorted)) {
                    close();
                    return null;
                }
                _mergerInputs = merge(presorted);
                _merger = _createMergeReader(_mergerInputs);
                iterator = new MergerIterator(_merger);
            }
        } finally {
            if (!inputClosed) {
                try {
                    inputReader.close();
                } catch (IOException e) {
                    // Ignore
                }
            }
        }
        if (_checkForCancel()) {
            close();
            return null;
        }
        _phase = Phase.COMPLETE;
        return iterator;
    }


    /*
    /**********************************************************************
    /* Closeable API
    /**********************************************************************
    */

    @Override
    public void close() {
        if (_merger != null) {
            try {
                _merger.close();
            }
            catch (IOException e) {
                // Ignore
            }
        }
        if (_mergerInputs != null) {
            for (File input : _mergerInputs) {
                input.delete();
            }
        }
        _mergerInputs = null;
        _merger = null;
    }

    /*
    /**********************************************************************
    /* Iterator implementations
    /**********************************************************************
    */

    private static class MergerIterator implements Iterator {
        private final DataReader _merger;
        private T _next;

        private MergerIterator(DataReader merger) throws IOException {
            _merger = merger;
            _next = _merger.readNext();
        }

        @Override
        public boolean hasNext() {
            return (_next != null);
        }

        @Override
        public T next() {
            if (_next == null) {
                throw new NoSuchElementException();
            }
            T t = _next;
            try {
                _next = _merger.readNext();
            } catch (IOException e) {
                throw new IterableSorterException(e);
            }
            return t;
        }

        @Override
        public void remove() {
            throw new UnsupportedOperationException();
        }
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy