All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.apex.malhar.stream.api.ApexStream Maven / Gradle / Ivy

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package org.apache.apex.malhar.stream.api;


import java.util.Map;
import java.util.concurrent.Callable;

import org.apache.apex.malhar.stream.api.function.Function;

import com.datatorrent.api.Attribute;
import com.datatorrent.api.Context.DAGContext;
import com.datatorrent.api.Context.OperatorContext;
import com.datatorrent.api.Context.PortContext;
import com.datatorrent.api.DAG;
import com.datatorrent.api.Operator;

/**
 * The stream interface to build a DAG
 * @param 
 *
 * @since 3.4.0
 */
public interface ApexStream
{
  /**
   * Simple map transformation
* Add an operator to the DAG which convert tuple T to tuple O * @param mapFunction map function * @param Type of the output * @return new stream of type O */ > STREAM map(Function.MapFunction mapFunction); /** * Simple map transformation
* Add an operator to the DAG which convert tuple T to tuple O * @param name operator name * @param mapFunction map function * @param Type of the output * @return new stream of type O */ > STREAM map(String name, Function.MapFunction mapFunction); /** * Flat map transformation * Add an operator to the DAG which convert tuple T to a collection of tuple O * @param flatten flat map * @param Type of the output * @return new stream of type O */ > STREAM flatMap(Function.FlatMapFunction flatten); /** * Flat map transformation
* Add an operator to the DAG which convert tuple T to a collection of tuple O * @param name operator name * @param flatten * @param Type of the output * @return new stream of type O */ > STREAM flatMap(String name, Function.FlatMapFunction flatten); /** * Filter transformation
* Add an operator to the DAG which filter out tuple T that cannot satisfy the FilterFunction * @param filter filter function * @return new stream of same type */ > STREAM filter(Function.FilterFunction filter); /** * Filter transformation
* Add an operator to the DAG which filter out tuple T that cannot satisfy the FilterFunction * @param name operator name * @param filter filter function * @return new stream of same type */ > STREAM filter(String name, Function.FilterFunction filter); /** * Reduce transformation
* Add an operator to the DAG which merge tuple t1, t2 to new tuple * @param reduce reduce function * @return new stream of same type */ > STREAM reduce(Function.ReduceFunction reduce); /** * Reduce transformation
* Add an operator to the DAG which merge tuple t1, t2 to new tuple * @param name operator name * @param reduce reduce function * @return new stream of same type */ > STREAM reduce(String name, Function.ReduceFunction reduce); /** * Fold transformation
* Add an operator to the DAG which merge tuple T to accumulated result tuple O * @param initialValue initial result value * @param fold fold function * @param Result type * @return new stream of type O */ > STREAM fold(O initialValue, Function.FoldFunction fold); /** * Fold transformation
* Add an operator to the DAG which merge tuple T to accumulated result tuple O * @param name name of the operator * @param initialValue initial result value * @param fold fold function * @param Result type * @return new stream of type O */ > STREAM fold(String name, O initialValue, Function.FoldFunction fold); /** * Count of all tuples * @return new stream of Integer */ > STREAM count(); /** * Count tuples by the key
* If the input is KeyedTuple it will get the key from getKey method from the tuple
* If not, use the tuple itself as a key * @return new stream of Map */ >> STREAM countByKey(); /** * * Count tuples by the indexed key * @param key the index of the field in the tuple that are used as key * @return new stream of Map */ >> STREAM countByKey(int key); /** * Extend the dag by adding one operator
* @param op Operator added to the stream * @param inputPort InputPort of the operator that is connected to last exposed OutputPort in the stream * @param outputPort OutputPort of the operator will be connected to next operator * @param type of the output * @return new stream of type O */ > STREAM addOperator(Operator op, Operator.InputPort inputPort, Operator.OutputPort outputPort); /** * Extend the dag by adding one {@see Operator} * @param opName Operator name * @param op Operator added to the stream * @param inputPort InputPort of the operator that is connected to last exposed OutputPort in the stream * @param outputPort OutputPort of the operator will be connected to next operator * @param type of the output * @return new stream of type O */ > STREAM addOperator(String opName, Operator op, Operator.InputPort inputPort, Operator.OutputPort outputPort); /** * Union multiple stream into one * @param others other streams * @return new stream of same type */ > STREAM union(ApexStream... others); /** * Add a stdout console output operator * @return stream itself */ > STREAM print(); /** * Add a stderr console output operator * @return stream itself */ > STREAM printErr(); /** * Set the attribute value
* If it is {@link DAGContext DAG attribute}, it will be applied to the whole DAG
* If it is {@link OperatorContext Operator attribute}, it will be applied to last connected operator
* If it is {@link PortContext InputPort attribute}, it will be applied to the input port of the last connected stream
* If it is {@link PortContext OutputPort attribute}, it will be applied to the output port of the last connected stream
* If it is both {@link PortContext InputPort&OutputPort attribute}, it will be applied to last connected stream * @param attribute {@see Attribute} * @param value value of the attribute * @return stream itself */ > STREAM with(Attribute attribute, Object value); /** * Set attributes at the DAG level * @param attribute {@see Attribute} * @param value value of the attribute * @return stream itself */ > STREAM setGlobalAttribute(Attribute attribute, Object value); /** * Set the locality * @param locality {@see DAG.Locality} * @return stream itself */ > STREAM with(DAG.Locality locality); /** * Set the property value of the last connected operator * @param propName property name * @param value value of the property * @return stream itself */ > STREAM with(String propName, Object value); /** * Create dag from stream * @return {@see DAG} */ DAG createDag(); /** * Populate existing dag * @param dag {@see DAG} */ void populateDag(DAG dag); /** * Run the stream application in local mode * In Async mode, the method would return immediately and the dag would run for "duration" milliseconds * In Sync mode, the method would block "duration" milliseconds to run the dag * If duration is negative the dag would run forever until being killed * @param async true if run in Async mode * false if run in sync mode */ void runEmbedded(boolean async, long duration, Callable exitCondition); /** * Submit the application to cluster */ void run(); }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy