
// com.yahoo.vespa.config.proxy.filedistribution.UrlDownloadRpcServer Maven / Gradle / Ivy
// Copyright 2019 Oath Inc. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
package com.yahoo.vespa.config.proxy.filedistribution;
import com.yahoo.concurrent.DaemonThreadFactory;
import com.yahoo.jrt.Method;
import com.yahoo.jrt.Request;
import com.yahoo.jrt.StringValue;
import com.yahoo.jrt.Supervisor;
import java.util.logging.Level;
import com.yahoo.text.Utf8;
import com.yahoo.vespa.defaults.Defaults;
import net.jpountz.xxhash.XXHashFactory;
import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.File;
import java.io.FileOutputStream;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.IOException;
import java.net.HttpURLConnection;
import java.net.URL;
import java.nio.ByteBuffer;
import java.nio.channels.Channels;
import java.nio.channels.ReadableByteChannel;
import java.nio.file.Files;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.TimeUnit;
import java.util.logging.Logger;
import static com.yahoo.vespa.config.UrlDownloader.DOES_NOT_EXIST;
import static com.yahoo.vespa.config.UrlDownloader.HTTP_ERROR;
import static com.yahoo.vespa.config.UrlDownloader.INTERNAL_ERROR;
/**
 * An RPC server that handles URL download requests.
 *
 * <p>Registers the RPC method {@code url.waitFor}, which takes a URL and returns the path to a local
 * file holding the downloaded contents. Each URL gets its own directory below {@link #downloadDir},
 * containing a {@code contents} file and a {@code lastmodified} file. The latter is used to send an
 * {@code If-Modified-Since} header so unchanged content is not downloaded again.
 *
 * @author lesters
 */
class UrlDownloadRpcServer {

    private final static Logger log = Logger.getLogger(UrlDownloadRpcServer.class.getName());

    private static final String CONTENTS_FILE_NAME = "contents";
    private static final String LAST_MODIFIED_FILE_NAME = "lastmodified";

    /** Root directory for all downloads; each URL gets a sub directory named by {@link #urlToDirName(String)}. */
    static final File downloadDir = new File(Defaults.getDefaults().underVespaHome("var/db/vespa/download"));

    /** Executes the downloads, using a fixed pool of at least 8 threads. */
    private final ExecutorService rpcDownloadExecutor = Executors.newFixedThreadPool(Math.max(8, Runtime.getRuntime().availableProcessors()),
                                                                                     new DaemonThreadFactory("Rpc URL download executor"));

    /**
     * Creates the server and registers the {@code url.waitFor} method on the given supervisor.
     *
     * @param supervisor the supervisor to add the RPC method to
     */
    UrlDownloadRpcServer(Supervisor supervisor) {
        supervisor.addMethod(new Method("url.waitFor", "s", "s", this::download)
                                    .methodDesc("get path to url download")
                                    .paramDesc(0, "url", "url")
                                    .returnDesc(0, "path", "path to file"));
    }

    /**
     * Shuts down the download executor and waits up to 10 seconds for it to terminate.
     *
     * @throws RuntimeException if the calling thread is interrupted while waiting; the interrupt
     *                          status of the thread is restored before throwing
     */
    void close() {
        rpcDownloadExecutor.shutdownNow();
        try {
            rpcDownloadExecutor.awaitTermination(10, TimeUnit.SECONDS);
        } catch (InterruptedException e) {
            // Restore the interrupt status so code further up the stack can still observe it
            Thread.currentThread().interrupt();
            throw new RuntimeException(e);
        }
    }

    /** RPC entry point: detaches the request and hands it to the download executor, which returns it when done. */
    private void download(Request req) {
        req.detach();
        rpcDownloadExecutor.execute(() -> downloadFile(req));
    }

    /**
     * Handles one request: downloads the URL given as the first parameter, or reuses the already
     * downloaded file if the server responds 304, and sets either the resulting path or an error
     * on the request before returning it.
     */
    private void downloadFile(Request req) {
        String url = req.parameters().get(0).asString();
        File urlDownloadDir = new File(UrlDownloadRpcServer.downloadDir, urlToDirName(url));

        try {
            URL website = new URL(url);
            HttpURLConnection connection = (HttpURLConnection) website.openConnection();
            setIfModifiedSince(connection, urlDownloadDir); // don't download if we already have the file
            int responseCode = connection.getResponseCode();
            if (responseCode == HttpURLConnection.HTTP_OK) {
                log.log(Level.INFO, "Downloading URL '" + url + "'");
                downloadFile(req, connection, urlDownloadDir);
            } else if (responseCode == HttpURLConnection.HTTP_NOT_MODIFIED) {
                log.log(Level.INFO, "URL '" + url + "' already downloaded (server response: 304)");
                req.returnValues().add(new StringValue(new File(urlDownloadDir, CONTENTS_FILE_NAME).getAbsolutePath()));
            } else {
                log.log(Level.SEVERE, "Download of URL '" + url + "' got server response: " + responseCode);
                req.setError(HTTP_ERROR, String.valueOf(responseCode));
            }
        } catch (Throwable e) {
            // Pass the throwable to the logger so the stack trace is kept, not only the message
            log.log(Level.SEVERE, "Download of URL '" + url + "' got exception: " + e.getMessage(), e);
            req.setError(INTERNAL_ERROR, "Download of URL '" + url + "' internal error: " + e.getMessage());
        } finally {
            // The request was detached in download(), so it must always be returned explicitly
            req.returnRequest();
        }
    }

    /**
     * Writes the response body of the given connection to the contents file in the given directory.
     * If the resulting file is non-empty, the last modified timestamp is stored, the request is
     * tracked through {@code RequestTracker} and the path to the file is added as return value.
     * Otherwise a {@code DOES_NOT_EXIST} error is set on the request.
     *
     * @throws IOException if creating the directory, reading the response or writing a file fails
     */
    private static void downloadFile(Request req, HttpURLConnection connection, File downloadDir) throws IOException {
        long start = System.currentTimeMillis();
        String url = connection.getURL().toString();
        Files.createDirectories(downloadDir.toPath());
        File contentsPath = new File(downloadDir, CONTENTS_FILE_NAME);
        File lastModifiedPath = new File(downloadDir, LAST_MODIFIED_FILE_NAME);

        try (ReadableByteChannel rbc = Channels.newChannel(connection.getInputStream())) {
            // Remove the timestamp of any previous download before overwriting its contents. Otherwise a
            // download failing midway leaves partial contents next to the old timestamp, and a later
            // request could get a 304 response and return the partial file.
            Files.deleteIfExists(lastModifiedPath.toPath());
            try (FileOutputStream fos = new FileOutputStream(contentsPath)) {
                fos.getChannel().transferFrom(rbc, 0, Long.MAX_VALUE);
            }
        }

        // Inspect the result only after the output stream has been closed
        if (contentsPath.exists() && contentsPath.length() > 0) {
            writeLastModifiedTimestamp(downloadDir, connection.getLastModified());
            new RequestTracker().trackRequest(downloadDir);
            req.returnValues().add(new StringValue(contentsPath.getAbsolutePath()));
            log.log(Level.FINE, () -> "URL '" + url + "' available at " + contentsPath);
            log.log(Level.INFO, String.format("Download of URL '%s' done in %.3f seconds",
                                              url, (System.currentTimeMillis() - start) / 1000.0));
        } else {
            log.log(Level.SEVERE, "Downloaded URL '" + url + "' not found, returning error");
            req.setError(DOES_NOT_EXIST, "Downloaded '" + url + "' not found");
        }
    }

    /** Returns the directory name for a URL: the 64-bit xxHash (seed 0) of the URL's bytes, as a decimal string. */
    private static String urlToDirName(String uri) {
        return String.valueOf(XXHashFactory.fastestJavaInstance().hash64().hash(ByteBuffer.wrap(Utf8.toBytes(uri)), 0));
    }

    /**
     * Sets the {@code If-Modified-Since} header on the connection when a non-empty contents file and
     * a positive stored timestamp exist in the given directory.
     *
     * @throws IOException if the stored timestamp cannot be read
     */
    private static void setIfModifiedSince(HttpURLConnection connection, File downloadDir) throws IOException {
        File contents = new File(downloadDir, CONTENTS_FILE_NAME);
        if (contents.exists() && contents.length() > 0) {
            long lastModified = readLastModifiedTimestamp(downloadDir);
            if (lastModified > 0) {
                connection.setIfModifiedSince(lastModified);
            }
        }
    }

    /**
     * Reads the timestamp stored in the last modified file in the given directory.
     *
     * @return the stored timestamp, or 0 if the file is missing, empty or does not contain a valid number
     * @throws IOException if the file cannot be read
     */
    private static long readLastModifiedTimestamp(File downloadDir) throws IOException {
        File lastModified = new File(downloadDir, LAST_MODIFIED_FILE_NAME);
        if (lastModified.exists() && lastModified.length() > 0) {
            try (BufferedReader br = new BufferedReader(new FileReader(lastModified))) {
                String timestamp = br.readLine();
                if (timestamp != null) {
                    return Long.parseLong(timestamp.trim());
                }
            } catch (NumberFormatException e) {
                // A corrupt timestamp must not fail every request for this URL: treat it as
                // missing, so the file is downloaded again and the timestamp rewritten
                log.log(Level.WARNING, "Ignoring invalid last modified timestamp in '" + lastModified + "'");
            }
        }
        return 0;
    }

    /**
     * Stores the given timestamp in the last modified file in the given directory, replacing any previous value.
     *
     * @throws IOException if the file cannot be written
     */
    private static void writeLastModifiedTimestamp(File downloadDir, long timestamp) throws IOException {
        File lastModified = new File(downloadDir, LAST_MODIFIED_FILE_NAME);
        try (BufferedWriter lastModifiedWriter = new BufferedWriter(new FileWriter(lastModified.getAbsolutePath()))) {
            lastModifiedWriter.write(Long.toString(timestamp));
        }
    }

}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy