All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.dataartisans.flink.cascading.planner.FlinkFlow Maven / Gradle / Ivy

/*
 * Copyright 2015 data Artisans GmbH
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *  http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.dataartisans.flink.cascading.planner;

import cascading.flow.BaseFlow;
import cascading.flow.FlowDef;
import cascading.flow.FlowException;
import cascading.flow.FlowProcess;
import cascading.flow.hadoop.util.HadoopUtil;
import cascading.flow.planner.PlatformInfo;
import com.dataartisans.flink.cascading.runtime.util.FlinkFlowProcess;
import org.apache.flink.client.program.OptimizerPlanEnvironment;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.mapred.JobConf;
import riffle.process.ProcessComplete;
import riffle.process.ProcessConfiguration;

import java.io.IOException;
import java.util.HashMap;
import java.util.Map;

public class FlinkFlow extends BaseFlow {

	private Configuration config;

	public FlinkFlow(PlatformInfo platformInfo, FlowDef flowDef, Map properties, Configuration defaultConfig) {

		super(platformInfo, properties, defaultConfig, flowDef);
	}

	@Override
	protected void initConfig(Map properties, Configuration parentConfig) {
		if( properties != null ) {
			parentConfig = createConfig( properties, parentConfig );
		}

		if( parentConfig == null ) {
		// this is ok, getJobConf will pass a default parent in
			return;
		}

		config = HadoopUtil.copyJobConf(parentConfig);
	}


	@Override
	protected void setConfigProperty(Configuration config, Object key, Object value) {
		// don't let these objects pass, even though toString is called below.
		if( value instanceof Class || value instanceof JobConf || value instanceof Configuration) {
			return;
		}

		config.set(key.toString(), value.toString());
	}

	@Override
	protected Configuration newConfig(Configuration defaultConfig) {
		return defaultConfig == null ? new Configuration() : HadoopUtil.copyJobConf(defaultConfig);
	}

	@Override
	@ProcessComplete
	public void complete() {
		try {
			super.complete();
		}
		catch(FlowException fe) {
			// check if we need to unwrap a ProgramAbortException
			Throwable t = fe.getCause();
			if (t instanceof OptimizerPlanEnvironment.ProgramAbortException) {
				throw (OptimizerPlanEnvironment.ProgramAbortException)t;
			}
			else {
				throw fe;
			}
		}
	}

	@Override
	protected void internalStart() {
		try {
			deleteSinksIfReplace();
			deleteTrapsIfReplace();
			deleteCheckpointsIfReplace();
		}
		catch( IOException exception ) {
			throw new FlowException( "unable to delete sinks", exception );
		}
	}

	@Override
	protected void internalClean(boolean b) {
		// TODO: clean-up execution
	}

	@Override
	protected void internalShutdown() {
		// nothing to do?
	}

	@Override
	protected int getMaxNumParallelSteps() {
		return 1;
	}

	@Override
	public Configuration getConfig() {
		if( config == null ) {
			initConfig(null, new Configuration());
		}

		return config;
	}

	@ProcessConfiguration
	@Override
	public Configuration getConfigCopy() {
		return HadoopUtil.copyJobConf(getConfig());
	}

	@Override
	public Map getConfigAsProperties() {
		Map props = new HashMap();

		Configuration conf = getConfig();
		for(Map.Entry e : conf) {
			String key = e.getKey();
			props.put(key, conf.get(key));
		}

		return props;
	}

	@Override
	public String getProperty(String key) {
		return getConfig().get(key);

	}

	@Override
	public FlowProcess getFlowProcess() {
		return new FlinkFlowProcess(getFlowSession(), getConfig());
	}

	@Override
	public boolean stepsAreLocal() {
		return false;
	}


}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy