All Downloads are FREE. Search and download functionalities are using the official Maven repository.

io.radanalytics.operator.cluster.InitContainersHelper Maven / Gradle / Ivy

There is a newer version: 1.0.4
Show newest version
package io.radanalytics.operator.cluster;

import io.fabric8.kubernetes.api.model.*;
import io.radanalytics.operator.historyServer.HistoryServerHelper;
import io.radanalytics.types.*;

import java.util.ArrayList;
import java.util.List;
import java.util.Optional;
import java.util.function.Predicate;

import static io.radanalytics.operator.Constants.getDefaultSparkImage;

public class InitContainersHelper {

    private static final String NEW_CONF_DIR = "conf-new-dir";
    private static final String NEW_CONF_DIR_PATH = "/tmp/config/new";
    private static final String DEFAULT_SPARK_HOME_PATH = "/opt/spark/";

    /**
     * Based on the SparkCluster configuration, it can add init-containers called 'downloader', 'backup-config' and/or
     * 'override-config'. The firs one will be added if the cluster.getDownloadData() is not empty, while the
     * latter two are always being added together if config map that overrides the default spark configuration exist in the
     * K8s or if the cluster.getSparkConfiguration() is not empty.
     *
     * Optionally adds the init containers that do:
     * 
    *
  1. makes the path for the history server writable by group
  2. *
  3. downloads the data with curl if it's specified
  4. *
  5. backups the original (default) Spark configuration into NEW_CONF_DIR_PATH
  6. *
  7. copies/replaces the config files in the NEW_CONF_DIR_PATH with the files coming from the config map
  8. *
  9. overrides (/appends) the key-value entries in the NEW_CONF_DIR_PATH/spark-defaults.conf
  10. *
  11. use the configuration NEW_CONF_DIR_PATH as the configuration for the spark
  12. *
* * * @param rc ReplicationController instance * @param cluster SparkCluster instance * @param cmExists whether config map with overrides exists * @return modified ReplicationController instance */ public static final ReplicationController addInitContainers(ReplicationController rc, SparkCluster cluster, boolean cmExists, boolean isMaster) { PodSpec podSpec = rc.getSpec().getTemplate().getSpec(); if (isMaster && HistoryServerHelper.needsVolume(cluster)) { createChmodHistoryServerContainer(cluster, podSpec); } if (!cluster.getDownloadData().isEmpty()) { createDownloader(cluster, podSpec); } if (cmExists || !cluster.getSparkConfiguration().isEmpty()) { createBackupContainer(cluster, podSpec); createConfigOverrideContainer(cluster, podSpec, cmExists); } rc.getSpec().getTemplate().setSpec(podSpec); return rc; } private static Container createDownloader(SparkCluster cluster, PodSpec podSpec) { final String mountName = "data-dir"; final String mountPath = "/tmp/"; final VolumeMount downloadMount = new VolumeMountBuilder().withName(mountName).withMountPath(mountPath).build(); final Volume downloadVolume = new VolumeBuilder().withName(mountName).withNewEmptyDir().endEmptyDir().build(); final List downloadData = cluster.getDownloadData(); final StringBuilder downloaderCmd = new StringBuilder(); downloadData.forEach(dl -> { String url = dl.getUrl(); String to = dl.getTo(); // if 'to' ends with slash, we know it's a directory and we use the -P switch to change the prefix, // otherwise using -O for renaming the downloaded file String param = to.endsWith("/") ? " -P " : " -O "; downloaderCmd.append("wget "); downloaderCmd.append(url); downloaderCmd.append(param); downloaderCmd.append(to); downloaderCmd.append(" ; "); }); Container downloader = new ContainerBuilder() .withName("downloader") .withImage("busybox") .withImagePullPolicy("IfNotPresent") .withCommand("/bin/sh", "-xc") .withArgs(downloaderCmd.toString()) .withVolumeMounts(downloadMount) .build(); podSpec.getContainers().get(0).getVolumeMounts().add(downloadMount); podSpec.getVolumes().add(downloadVolume); podSpec.getInitContainers().add(downloader); return downloader; } private static Container createBackupContainer(SparkCluster cluster, PodSpec podSpec) { final VolumeMount backupMount = new VolumeMountBuilder().withName(NEW_CONF_DIR).withMountPath(NEW_CONF_DIR_PATH).build(); final Volume backupVolume = new VolumeBuilder().withName(NEW_CONF_DIR).withNewEmptyDir().endEmptyDir().build(); Container backup = new ContainerBuilder() .withName("backup-config") .withImage(Optional.ofNullable(cluster.getCustomImage()).orElse(getDefaultSparkImage())) .withCommand("/bin/sh", "-xc") .withArgs("cp -r " + getSparkHome(cluster) + "/conf/* " + NEW_CONF_DIR_PATH) .withVolumeMounts(backupMount) .build(); podSpec.getContainers().get(0).getVolumeMounts().add(backupMount); podSpec.getVolumes().add(backupVolume); podSpec.getInitContainers().add(backup); return backup; } private static Container createChmodHistoryServerContainer(SparkCluster cluster, PodSpec podSpec) { SharedVolume sharedVolume = Optional.ofNullable(cluster.getHistoryServer().getSharedVolume()).orElse(new SharedVolume()); final VolumeMount mount = new VolumeMountBuilder().withName("history-server-volume").withMountPath(sharedVolume.getMountPath()).build(); Container chmod = new ContainerBuilder() .withName("chmod-history-server") // .withNewSecurityContext().withPrivileged(true).endSecurityContext() .withImage("busybox") .withCommand("/bin/sh", "-xc") .withArgs("mkdir -p " + sharedVolume.getMountPath() + " || true ; chmod -R go+ws " + sharedVolume.getMountPath() + " || true") .withVolumeMounts(mount) .build(); Volume historyVolume = new VolumeBuilder() .withName("history-server-volume") .withNewPersistentVolumeClaim() .withReadOnly(false) .withClaimName(cluster.getName() + "-claim") .endPersistentVolumeClaim() .build(); podSpec.getContainers().get(0).getVolumeMounts().add(mount); podSpec.getVolumes().add(historyVolume); podSpec.getInitContainers().add(chmod); return chmod; } private static Container createConfigOverrideContainer(SparkCluster cluster, PodSpec podSpec, boolean cmExists) { final List config = cluster.getSparkConfiguration(); String cmMountName = "configmap-dir"; String cmMountPath = "/tmp/config/fromCM"; List mounts = new ArrayList<>(2); if (cmExists) { String cmName = getExpectedCMName(cluster); final VolumeMount cmMount = new VolumeMountBuilder().withName(cmMountName).withMountPath(cmMountPath).build(); final Volume cmVolume = new VolumeBuilder().withName(cmMountName).withNewConfigMap().withName(cmName).endConfigMap().build(); podSpec.getVolumes().add(cmVolume); mounts.add(cmMount); } final VolumeMount backupMount = new VolumeMountBuilder().withName(NEW_CONF_DIR).withMountPath(NEW_CONF_DIR_PATH).build(); final String origConfMountName = "conf-orig-dir"; final VolumeMount origConfMount = new VolumeMountBuilder().withName(origConfMountName).withMountPath(getSparkHome(cluster) + "/conf/").build(); final Volume origConfVolume = new VolumeBuilder().withName(origConfMountName).withNewEmptyDir().endEmptyDir().build(); mounts.add(backupMount); mounts.add(origConfMount); final StringBuilder overrideConfigCmd = new StringBuilder(); if (cmExists) { // add/replace the content of NEW_CONF_DIR_PATH with all the files that comes from the config map overrideConfigCmd.append("cp -r "); overrideConfigCmd.append(cmMountPath); overrideConfigCmd.append("/..data/* "); overrideConfigCmd.append(NEW_CONF_DIR_PATH); if (!config.isEmpty()) { overrideConfigCmd.append(" ; "); } } if (!config.isEmpty()) { // override the key-value entries in the spark-defaults.conf overrideConfigCmd.append("echo -e \""); config.forEach(kv -> { overrideConfigCmd.append(kv.getName()); overrideConfigCmd.append(" "); overrideConfigCmd.append(kv.getValue()); overrideConfigCmd.append("\\n"); }); overrideConfigCmd.append("\" >> "); overrideConfigCmd.append(NEW_CONF_DIR_PATH); overrideConfigCmd.append("/spark-defaults.conf"); } // replace the content of $SPARK_HOME/conf with the newly created config files overrideConfigCmd.append(" && cp -r "); overrideConfigCmd.append(NEW_CONF_DIR_PATH); overrideConfigCmd.append("/* "); overrideConfigCmd.append(getSparkHome(cluster) + "/conf/"); Container overrideConfig = new ContainerBuilder() .withName("override-config") .withImage("busybox") .withImagePullPolicy("IfNotPresent") .withCommand("/bin/sh", "-xc") .withArgs(overrideConfigCmd.toString()) .withVolumeMounts(mounts) .build(); podSpec.getInitContainers().add(overrideConfig); podSpec.getContainers().get(0).getVolumeMounts().add(origConfMount); podSpec.getVolumes().add(origConfVolume); return overrideConfig; } private static String getSparkHome(SparkCluster cluster) { Predicate p = nv -> "SPARK_HOME".equals(nv.getName()); if (!cluster.getEnv().isEmpty() && cluster.getEnv().stream().anyMatch(p)) { Optional sparkHome = cluster.getEnv().stream().filter(p).findFirst(); if (sparkHome.isPresent() && null != sparkHome.get().getValue() && !sparkHome.get().getValue().trim().isEmpty()) { return sparkHome.get().getValue(); } } return DEFAULT_SPARK_HOME_PATH; } /** * Returns the cluster.getSparkConfigurationMap() if it's there. If not, it defaults to the * name of the spark cluster concatenated with '-config' suffix. * * @param cluster SparkCluster instance * @return expected name of the config map */ public static String getExpectedCMName(SparkCluster cluster) { return cluster.getSparkConfigurationMap() == null ? cluster.getName() + "-config" : cluster.getSparkConfigurationMap(); } /** * Calculates the expected initial delay for the liveness or readiness probe for master or worker * it considers these attributes: *
    *
  • if there is anything to download
  • *
  • if config map with overrides exists
  • *
  • if key-value config entries were passed in the custom resource/CM
  • *
  • cpu limit
  • *
* * Also worker node gets some minor penalisation, because its probe depends on the master's readiness. * * @param cluster SparkCluster instance * @param cmExists if config map with overrides exists * @param isMaster whether it is master or worker * @return expected time for initial delay for the probes */ public static int getExpectedDelay(SparkCluster cluster, boolean cmExists, boolean isMaster) { // todo: honor the chmod init cont. int delay = 6; if (isMaster) { if (null != cluster.getMaster() && null != cluster.getMaster().getCpu()) { try { double cpu = Double.parseDouble(cluster.getMaster().getCpu()); delay += (1.0 / cpu) * 3.5; } catch (NumberFormatException nfe) { // ignore } } delay += 0; } else { if (null != cluster.getWorker() && null != cluster.getWorker().getCpu()) { try { double cpu = Double.parseDouble(cluster.getWorker().getCpu()); delay += (1.0 / cpu) * 3.5; } catch (NumberFormatException nfe) { // ignore } } delay += 4; } delay += cmExists ? 3 : 0; delay += !cluster.getSparkConfiguration().isEmpty() ? 3 : 0; delay += cluster.getDownloadData().size() * 4; return delay; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy