org.apache.flink.client.program.DefaultPackagedProgramRetriever Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.client.program;
import org.apache.flink.annotation.VisibleForTesting;
import org.apache.flink.client.deployment.application.EntryClassInformationProvider;
import org.apache.flink.client.deployment.application.FromClasspathEntryClassInformationProvider;
import org.apache.flink.client.deployment.application.FromJarEntryClassInformationProvider;
import org.apache.flink.configuration.ConfigUtils;
import org.apache.flink.configuration.Configuration;
import org.apache.flink.configuration.PipelineOptions;
import org.apache.flink.util.FileUtils;
import org.apache.flink.util.FlinkException;
import org.apache.flink.util.function.FunctionUtils;
import javax.annotation.Nullable;
import java.io.File;
import java.io.IOException;
import java.net.MalformedURLException;
import java.net.URL;
import java.nio.file.Files;
import java.nio.file.Path;
import java.util.ArrayList;
import java.util.Collection;
import java.util.Collections;
import java.util.List;
import java.util.NoSuchElementException;
import java.util.stream.Collectors;
import java.util.stream.Stream;
import static org.apache.flink.util.Preconditions.checkNotNull;
/**
* {@code PackageProgramRetrieverImpl} is the default implementation of {@link
* PackagedProgramRetriever} that can either retrieve a {@link PackagedProgram} from a specific jar,
* some provided user classpath or the system classpath.
*/
public class DefaultPackagedProgramRetriever implements PackagedProgramRetriever {
private final EntryClassInformationProvider entryClassInformationProvider;
private final String[] programArguments;
private final List userClasspath;
private final Configuration configuration;
/**
* See ${@link DefaultPackagedProgramRetriever#create(File, File, Collection, String, String[],
* Configuration)} .
*/
public static DefaultPackagedProgramRetriever create(
@Nullable File userLibDir,
@Nullable String jobClassName,
String[] programArgs,
Configuration configuration)
throws FlinkException {
return create(userLibDir, null, jobClassName, programArgs, configuration);
}
/**
* See ${@link DefaultPackagedProgramRetriever#create(File, File, Collection, String, String[],
* Configuration)} .
*/
public static DefaultPackagedProgramRetriever create(
@Nullable File userLibDir,
@Nullable File jarFile,
@Nullable String jobClassName,
String[] programArgs,
Configuration configuration)
throws FlinkException {
return create(userLibDir, jarFile, null, jobClassName, programArgs, configuration);
}
/**
* Creates a {@code PackageProgramRetrieverImpl} with the given parameters.
*
* @param userLibDir The user library directory that is used for generating the user classpath
* if specified. The system classpath is used if not specified.
* @param jarFile The jar archive expected to contain the job class included; {@code null} if
* the job class is on the system classpath.
* @param userArtifacts The user artifacts that should be added to the user classpath if
* specified.
* @param jobClassName The job class to use; if {@code null} the user classpath (or, if not set,
* the system classpath) will be scanned for possible main class.
* @param programArgs The program arguments.
* @param configuration The Flink configuration for the given job.
* @return The {@code PackageProgramRetrieverImpl} that can be used to create a {@link
* PackagedProgram} instance.
* @throws FlinkException If something goes wrong during instantiation.
*/
public static DefaultPackagedProgramRetriever create(
@Nullable File userLibDir,
@Nullable File jarFile,
@Nullable Collection userArtifacts,
@Nullable String jobClassName,
String[] programArgs,
Configuration configuration)
throws FlinkException {
List userClasspaths;
try {
final List classpathsFromUserLibDir =
getClasspathsFromUserLibDir(userLibDir, jarFile);
final List classpathsFromUserArtifactDir =
getClasspathsFromArtifacts(userArtifacts, jarFile);
final List classpathsFromConfiguration =
getClasspathsFromConfiguration(configuration);
final List classpaths = new ArrayList<>();
classpaths.addAll(classpathsFromUserLibDir);
classpaths.addAll(classpathsFromUserArtifactDir);
classpaths.addAll(classpathsFromConfiguration);
userClasspaths = Collections.unmodifiableList(classpaths);
} catch (IOException e) {
throw new FlinkException("An error occurred while extracting the user classpath.", e);
}
final EntryClassInformationProvider entryClassInformationProvider =
createEntryClassInformationProvider(
(userLibDir == null && userArtifacts == null) ? null : userClasspaths,
jarFile,
jobClassName,
programArgs);
return new DefaultPackagedProgramRetriever(
entryClassInformationProvider, programArgs, userClasspaths, configuration);
}
@VisibleForTesting
static EntryClassInformationProvider createEntryClassInformationProvider(
@Nullable Iterable userClasspath,
@Nullable File jarFile,
@Nullable String jobClassName,
String[] programArgs)
throws FlinkException {
if (PackagedProgramUtils.isPython(jobClassName)
|| PackagedProgramUtils.isPython(programArgs)) {
return FromJarEntryClassInformationProvider.createFromPythonJar();
}
if (jarFile != null) {
return FromJarEntryClassInformationProvider.createFromCustomJar(jarFile, jobClassName);
}
if (userClasspath != null) {
return fromUserClasspath(jobClassName, userClasspath);
}
return fromSystemClasspath(jobClassName);
}
private static EntryClassInformationProvider fromSystemClasspath(@Nullable String jobClassName)
throws FlinkException {
if (jobClassName != null) {
return FromClasspathEntryClassInformationProvider
.createWithJobClassAssumingOnSystemClasspath(jobClassName);
}
try {
return FromClasspathEntryClassInformationProvider.createFromSystemClasspath();
} catch (IOException | NoSuchElementException | IllegalArgumentException t) {
throw createGenericFlinkException(t);
}
}
private static EntryClassInformationProvider fromUserClasspath(
@Nullable String jobClassName, Iterable userClasspath) throws FlinkException {
try {
if (jobClassName != null) {
return FromClasspathEntryClassInformationProvider.create(
jobClassName, userClasspath);
}
return FromClasspathEntryClassInformationProvider.createFromClasspath(userClasspath);
} catch (IOException e) {
throw createGenericFlinkException(e);
}
}
private static FlinkException createGenericFlinkException(Throwable t) {
return new FlinkException("An error occurred while access the provided classpath.", t);
}
private DefaultPackagedProgramRetriever(
EntryClassInformationProvider entryClassInformationProvider,
String[] programArguments,
List userClasspath,
Configuration configuration) {
this.entryClassInformationProvider =
checkNotNull(
entryClassInformationProvider, "No EntryClassInformationProvider passed.");
this.programArguments =
checkNotNull(programArguments, "No program parameter array passed.");
this.userClasspath = checkNotNull(userClasspath, "No user classpath passed.");
this.configuration = checkNotNull(configuration, "No Flink configuration was passed.");
}
@Override
public PackagedProgram getPackagedProgram() throws FlinkException {
try {
final PackagedProgram.Builder packagedProgramBuilder =
PackagedProgram.newBuilder()
.setUserClassPaths(userClasspath)
.setArguments(programArguments)
.setConfiguration(configuration);
entryClassInformationProvider
.getJobClassName()
.ifPresent(packagedProgramBuilder::setEntryPointClassName);
entryClassInformationProvider
.getJarFile()
.ifPresent(packagedProgramBuilder::setJarFile);
return packagedProgramBuilder.build();
} catch (ProgramInvocationException e) {
throw new FlinkException("Could not load the provided entrypoint class.", e);
}
}
private static List getClasspathsFromUserLibDir(
@Nullable File userLibDir, @Nullable File jarFile) throws IOException {
if (userLibDir == null) {
return Collections.emptyList();
}
try (Stream files = Files.walk(userLibDir.toPath())) {
return getClasspathsFromArtifacts(files, jarFile);
}
}
private static List getClasspathsFromArtifacts(
@Nullable Collection userArtifacts, @Nullable File jarFile) {
if (userArtifacts == null) {
return Collections.emptyList();
}
return getClasspathsFromArtifacts(userArtifacts.stream().map(File::toPath), jarFile);
}
private static List getClasspathsFromArtifacts(
Stream userArtifacts, @Nullable File jarFile) {
checkNotNull(userArtifacts);
final Path workingDirectory = FileUtils.getCurrentWorkingDirectory();
final List relativeJarURLs =
userArtifacts
.filter(path -> FileUtils.isJarFile(path) && !path.toFile().equals(jarFile))
.map(path -> FileUtils.relativizePath(workingDirectory, path))
.map(FunctionUtils.uncheckedFunction(FileUtils::toURL))
.collect(Collectors.toList());
return Collections.unmodifiableList(relativeJarURLs);
}
private static List getClasspathsFromConfiguration(Configuration configuration)
throws MalformedURLException {
if (configuration == null) {
return Collections.emptyList();
}
return ConfigUtils.decodeListFromConfig(
configuration, PipelineOptions.CLASSPATHS, URL::new);
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy