
io.virtdata.stathelpers.aliasmethod.WeightedStrings Maven / Gradle / Ivy
package io.virtdata.stathelpers.aliasmethod;
import io.virtdata.api.ThreadSafeMapper;
import io.virtdata.stathelpers.EvProbD;
import io.virtdata.util.ResourceFinder;
import org.apache.commons.csv.CSVParser;
import org.apache.commons.csv.CSVRecord;
import java.util.ArrayList;
import java.util.List;
import java.util.function.LongFunction;
@ThreadSafeMapper
public class WeightedStrings implements LongFunction {
private final String[] filenames;
private final String valueColumn;
private final String weightColumn;
private final String[] lines;
private final AliasSampler sampler;
public WeightedStrings(String valueColumn, String weightColumn, String... filenames) {
this.filenames = filenames;
this.valueColumn = valueColumn;
this.weightColumn = weightColumn;
List events = new ArrayList<>();
List values = new ArrayList<>();
for (String filename: filenames) {
CSVParser csvdata = ResourceFinder.readFileCSV(filename);
for (CSVRecord csvdatum : csvdata) {
String value = csvdatum.get(valueColumn);
values.add(value);
String weight = csvdatum.get(weightColumn);
events.add(new EvProbD(values.size()-1,Double.valueOf(weight)));
}
}
sampler = new AliasSampler(events);
lines = values.toArray(new String[0]);
}
@Override
public String apply(long value) {
double unitValue = (double) value / (double) Long.MAX_VALUE;
int idx = sampler.applyAsInt(unitValue);
return lines[idx];
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy