io.hyperfoil.tools.horreum.changedetection.HunterEDivisiveModel Maven / Gradle / Ivy
package io.hyperfoil.tools.horreum.changedetection;
import java.io.BufferedReader;
import java.io.File;
import java.io.FileOutputStream;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.io.OutputStream;
import java.io.PrintWriter;
import java.nio.file.Files;
import java.nio.file.Path;
import java.time.Instant;
import java.util.Arrays;
import java.util.Collections;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import java.util.function.Consumer;
import java.util.function.Function;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import java.util.stream.Collectors;
import jakarta.enterprise.context.ApplicationScoped;
import org.jboss.logging.Logger;
import com.fasterxml.jackson.databind.JsonNode;
import com.fasterxml.jackson.databind.node.TextNode;
import io.hyperfoil.tools.horreum.api.data.ConditionConfig;
import io.hyperfoil.tools.horreum.api.data.changeDetection.ChangeDetectionModelType;
import io.hyperfoil.tools.horreum.entity.alerting.ChangeDAO;
import io.hyperfoil.tools.horreum.entity.alerting.DataPointDAO;
@ApplicationScoped
public class HunterEDivisiveModel implements ChangeDetectionModel {
private static final Logger log = Logger.getLogger(HunterEDivisiveModel.class);
public static final String HUNTER_CONFIG = "HUNTER_CONFIG";
private static String[] HEADERS = { "kpi", "timestamp", "datasetid" };
private static final Pattern datapointPattern = Pattern.compile(
"(?^\\d{4}-[01]\\d-[0-3]\\d\\s[0-2]\\d:[0-5]\\d:[0-5]\\d)\\s[+|-]\\d{4}\\s+(?\\d+)\\s+(?\\d+?\\.?\\d+)$");
@Override
public ConditionConfig config() {
ConditionConfig conditionConfig = new ConditionConfig(ChangeDetectionModelType.names.EDIVISIVE, "eDivisive - Hunter",
"This model uses the Hunter eDivisive algorithm to determine change points in a continual series.");
conditionConfig.defaults.put("model", new TextNode(ChangeDetectionModelType.names.EDIVISIVE));
return conditionConfig;
}
@Override
public ChangeDetectionModelType type() {
return ChangeDetectionModelType.EDIVISIVE;
}
@Override
public void analyze(List dataPoints, JsonNode configuration, Consumer changeConsumer)
throws ChangeDetectionException {
TmpFiles tmpFiles = null;
try {
try {
tmpFiles = TmpFiles.instance();
} catch (IOException e) {
String errMsg = "Could not create temporary file for Hunter eDivisive algorithm";
log.error(errMsg, e);
throw new ChangeDetectionException(errMsg, e);
}
try (final FileWriter fw = new FileWriter(tmpFiles.inputFile, true);
final PrintWriter pw = new PrintWriter(fw);) {
Collections.reverse(dataPoints);
//write out csv fields
pw.println(Arrays.stream(HEADERS).collect(Collectors.joining(",")));
dataPoints.forEach(dataPointDAO -> pw.println(
String.format("%.2f,%s,%d", dataPointDAO.value, dataPointDAO.timestamp.toString(), dataPointDAO.id)));
} catch (IOException e) {
String errMsg = "Could not create file writer for Hunter eDivisive algorithm";
log.error(errMsg, e);
throw new ChangeDetectionException(errMsg, e);
}
log.debugf("created csv output : %s", tmpFiles.inputFile.getAbsolutePath());
if (!validateInputCsv(tmpFiles)) {
String errMsg = String.format("could not validate: %s", tmpFiles.inputFile);
log.error(errMsg);
throw new ChangeDetectionException(errMsg);
}
DataPointDAO firstDatapoint = dataPoints.get(0);
processChangePoints(
(dataPointID) -> dataPoints.stream().filter(dataPoint -> dataPoint.id.equals(dataPointID)).findFirst(),
changeConsumer,
tmpFiles,
firstDatapoint.timestamp);
} finally {
if (tmpFiles != null) {
tmpFiles.cleanup();
}
}
}
protected void processChangePoints(Function> changePointSupplier,
Consumer changeConsumer, TmpFiles tmpFiles, Instant sinceInstance) {
String command = "hunter analyze horreum --since '" + sinceInstance.toString() + "'";
log.debugf("Running command: %s", command);
List results = executeProcess(tmpFiles, false, "bash", "-l", "-c", command);
/*
* We are parsing the result file from Hunter, which has the following format;
* INFO: Computing change points for test horreum...
* time datasetid kpi
* ------------------------- ----------- -----
* 2024-04-27 06:55:06 +0000 1 1
* ...
* 2024-04-27 06:55:06 +0000 8 2
* 2024-04-27 06:55:06 +0000 9 2
* ·····
* +542.9%
* ·····
* 2024-04-27 06:55:06 +0000 10 10
*/
//if there are no results, the file will contain only the header
if (results.size() > 3) {
Iterator resultIter = results.iterator();
while (resultIter.hasNext()) {
String line = resultIter.next();
//change points are denoted by a series of '··' characters
//the line after the '··' contains the change point details
if (line.contains("··")) {
String change = resultIter.next().trim();
resultIter.next(); // skip line after the change details containing '··'
String changeDetails = resultIter.next(); //the next line is the datapoint that the change was detected for
Matcher foundChange = datapointPattern.matcher(changeDetails);
if (foundChange.matches()) {
String timestamp = foundChange.group("timestamp");
Integer datapointID = Integer.parseInt(foundChange.group("dataPointId"));
log.debugf("Found change point `%s` at `%s` for dataset: %d", change, timestamp, datapointID);
Optional foundDataPoint = changePointSupplier.apply(datapointID);
if (foundDataPoint.isPresent()) {
ChangeDAO changePoint = ChangeDAO.fromDatapoint(foundDataPoint.get());
changePoint.description = String.format("eDivisive change `%s` at `%s` for dataset: %d", change,
timestamp, datapointID);
log.trace(changePoint.description);
changeConsumer.accept(changePoint);
} else {
log.errorf("Could not find datapoint (%d) in set!", datapointID);
}
} else {
log.errorf("Could not parse hunter line: '%s'", changeDetails);
}
}
}
} else {
log.debugf("No change points were detected in : %s", tmpFiles.tmpdir.getAbsolutePath());
}
}
protected boolean validateInputCsv(TmpFiles tmpFiles) {
executeProcess(tmpFiles, true, "bash", "-l", "-c", "hunter validate");
try (FileReader fileReader = new FileReader(tmpFiles.logFile);
BufferedReader reader = new BufferedReader(fileReader);) {
Optional optLine = reader.lines().filter(line -> line.contains("Validation finished")).findFirst();
if (optLine.isEmpty()) {
log.errorf("Could not validate: %s", tmpFiles.tmpdir.getAbsolutePath());
return false;
}
if (optLine.get().contains("INVALID")) {
log.errorf("Invalid format for: %s; see log for details: %s", tmpFiles.tmpdir.getAbsolutePath(),
tmpFiles.logFile.getAbsolutePath());
return false;
}
} catch (IOException e) {
throw new RuntimeException(e);
}
return true;
}
@Override
public ModelType getType() {
return ModelType.BULK;
}
protected static class TmpFiles {
final File inputFile;
final File tmpdir;
final File confFile;
final File logFile;
public static TmpFiles instance() throws IOException {
return new TmpFiles();
}
public TmpFiles() throws IOException {
tmpdir = Files.createTempDirectory("hunter").toFile();
Path respourcesPath = Path.of(tmpdir.getAbsolutePath(), "tests", "resources");
Files.createDirectories(respourcesPath);
inputFile = Path.of(respourcesPath.toFile().getAbsolutePath(), "horreum.csv").toFile();
confFile = Path.of(respourcesPath.toFile().getAbsolutePath(), "hunter.yaml").toFile();
logFile = Path.of(respourcesPath.toFile().getAbsolutePath(), "hunter.log").toFile();
try (InputStream confInputStream = HunterEDivisiveModel.class.getClassLoader()
.getResourceAsStream("changeDetection/hunter.yaml")) {
if (confInputStream == null) {
log.error("Could not extract Hunter configuration from archive");
return;
}
try (OutputStream confOut = new FileOutputStream(confFile)) {
confOut.write(confInputStream.readAllBytes());
} catch (IOException e) {
log.error("Could not extract Hunter configuration from archive");
}
} catch (IOException e) {
log.error("Could not create temporary file for Hunter eDivisive algorithm", e);
}
}
protected void cleanup() {
if (tmpdir.exists()) {
clearDir(tmpdir);
} else {
log.debugf("Trying to cleanup temp files, but they do not exist!");
}
}
private void clearDir(File dir) {
Arrays.stream(dir.listFiles()).forEach(file -> {
if (file.isDirectory()) {
clearDir(file);
}
file.delete();
});
if (!dir.delete()) {
log.errorf("Failed to cleanup up temporary files: %s", dir.getAbsolutePath());
}
}
}
protected List executeProcess(TmpFiles tmpFiles, boolean redirectOutput, String... command) {
ProcessBuilder processBuilder = new ProcessBuilder(command);
Map env = processBuilder.environment();
env.put(HUNTER_CONFIG, tmpFiles.confFile.getAbsolutePath());
processBuilder.directory(tmpFiles.tmpdir);
processBuilder.redirectErrorStream(redirectOutput);
if (redirectOutput)
processBuilder.redirectOutput(ProcessBuilder.Redirect.appendTo(tmpFiles.logFile));
Process process = null;
try {
process = processBuilder.start();
List results = readOutput(process.getInputStream());
int exitCode = process.waitFor();
if (exitCode != 0) {
log.errorf("Hunter process failed with exit code: %d", exitCode);
log.errorf("See error log for details: %s", tmpFiles.logFile.getAbsolutePath());
return null;
}
return results;
} catch (IOException | InterruptedException e) {
if (process != null) {
process.destroy();
}
throw new RuntimeException(e);
}
}
private List readOutput(InputStream inputStream) throws IOException {
try (BufferedReader output = new BufferedReader(new InputStreamReader(inputStream))) {
return output.lines()
.collect(Collectors.toList());
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy