All downloads are free. Search and download functionality uses the official Maven repository.

tri.timeseries.io.TimeSeriesUrlCachingProcessor.kt Maven / Gradle / Ivy

The newest version!
/*-
 * #%L
 * coda-data-0.2.9-SNAPSHOT
 * --
 * Copyright (C) 2020 - 2023 Elisha Peterson
 * --
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 * 
 *      http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 * #L%
 */
package tri.timeseries.io

import tri.timeseries.*
import tri.util.measureTimedValue
import java.io.InputStream
import java.net.URL

/**
 * Processes time series whose raw and processed data are both addressed by [URL].
 *
 * Raw data is gathered by calling [inprocess] on every URL supplied by [rawSources] and passing the
 * combined result through [process]. Processed data is read back from the single URL supplied by
 * [processed].
 *
 * NOTE(review): list element types are spelled out as `URL` / `TimeSeries`; confirm they match the
 * signatures declared by [TimeSeriesProcessor].
 *
 * @property rawSources supplies the URLs that raw data is loaded from
 * @property processed supplies the URL of the processed resource
 * @property resourceLoader opens an input stream for a URL
 * @property resourceExists predicate evaluated on the processed URL; its result is forwarded to
 *   [TimeSeriesCachingProcessor.logLoadProcessedResource] (presumably "does the resource exist" — confirm)
 */
abstract class TimeSeriesUrlCachingProcessor(
    val rawSources: () -> List<URL>,
    val processed: () -> URL,
    val resourceLoader: (URL) -> InputStream,
    val resourceExists: (URL) -> Boolean
) : TimeSeriesProcessor() {

    /** Returns the class name followed by the current list of raw source URLs. */
    override fun toString() = "TimeSeriesUrlCachingProcessor ${rawSources()}"

    /**
     * Reads the processed series from the URL supplied by [processed], decoding it as UTF-8.
     *
     * The read is delegated to [TimeSeriesCachingProcessor.logLoadProcessedResource], which receives the
     * URL and the result of [resourceExists] for that URL.
     */
    override fun loadProcessed(): List<TimeSeries> {
        val url = processed()
        return TimeSeriesCachingProcessor.logLoadProcessedResource(url, resourceExists(url)) { resource ->
            // Close the stream opened by resourceLoader once reading finishes (or fails), so it is not
            // leaked. A second close() is harmless should readSeries already close it.
            resourceLoader(resource).use { stream ->
                TimeSeriesFileFormat.readSeries(stream, Charsets.UTF_8)
            }
        }
    }

    /**
     * Regroups [series] with `regroupAndMax` (both `coerceIncreasing` and `replaceZerosWithPrevious`
     * disabled), records a processing note with the resulting count and elapsed time, and returns the
     * regrouped series. Subclasses may override this to change the post-processing step.
     */
    open fun process(series: List<TimeSeries>) = measureTimedValue {
        series.regroupAndMax(coerceIncreasing = false, replaceZerosWithPrevious = false)
    }.let { timed ->
        processingNote("Regrouped data into ${timed.value.size} time series in ${timed.duration}")
        timed.value
    }

    /**
     * Loads raw data from every URL supplied by [rawSources] via [inprocess], recording a processing
     * note before and after each load, then runs the concatenated rows through [process].
     */
    override fun loadRaw() = process(rawSources().flatMap { url ->
        measureTimedValue {
            processingNote("Loading data from $url...")
            inprocess(url)
        }.let { timed ->
            processingNote("Loaded ${timed.value.size} rows in ${timed.duration} from $url")
            timed.value
        }
    })

    /** Loads the raw series found at [url]; called once per raw source by [loadRaw]. */
    abstract fun inprocess(url: URL): List<TimeSeries>

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy