All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.datatorrent.lib.testbench.SeedEventClassifier Maven / Gradle / Ivy

/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package com.datatorrent.lib.testbench;

import java.util.HashMap;

import javax.validation.constraints.NotNull;

import com.datatorrent.api.Context.OperatorContext;
import com.datatorrent.api.DefaultInputPort;
import com.datatorrent.api.DefaultOutputPort;
import com.datatorrent.common.util.BaseOperator;

/**
 * This operator receives data on two input ports (data1, and data2). 
 * Each incoming tuple is given a seed value
 * and a key depending on which input port the tuple came from. 
 * Modified tuples are then emitted as strings on the string_data output port
 * and as maps on the hash_data output port.
 * 

*
* Examples of getting seed distributions include
* Changes in mobile co-ordinates of a phone
* Random changes on motion of an object
*
* The seed is created from the values of properties seed_start, and seed_end *
* Default schema:
* Schema for port data: The default schema is {@code HashMap<String, ArrayList<valueData>>}, where valueData is class{String, Integer}
* String schema: The string is "key;valkey1:value1;valkey2:value2;..."
* HashMap schema: Key is String, and Value is an ArrayList
* The value in both the schemas is an integer (for choice of strings, these are enum values) *
* Port Interface
* data1: Expects tuples of type T
* data2: Expects tuples of type T
* string_data: Emits new classified seed of schema String
* hash_data: Emits new classified seed of schema {@code HashMap<String, HashMap<String, T>>}
*
* Properties:
* seed_start: An integer for the seed to start from
* seed_end: An integer for the seed to end with
*
* string_schema: If set to true, operates in string schema mode
*
* key: Classifier keys to be inserted in order for each incoming tuple. Format is "key1,key1start, key1end; key2, key2start, key2end;..."
* Compile time checks are:
* seed_start: Has to be an integer
* seed_end: Has to be an integer
* key: If provided, has to be in format "key1,key1start,key1end;key2, key2start, key2end; ..."
* Benchmarks: Blast as many tuples as possible in inline mode
* String: Benchmarked at over 13 million tuples/second in local/in-line mode
* Integer: Benchmarked at over 7 million tuples/second in local/in-line mode
*

* @displayName Seed Event Classifier
* @category Test Bench
* @tags generate
* @since 0.3.2
* @param <T> type of the tuples received on the two input ports
*/
public class SeedEventClassifier<T> extends BaseOperator {
  /**
   * An input port which receives incoming tuples; each tuple is emitted
   * under the classifier key {@code key1}.
   */
  public final transient DefaultInputPort<T> data1 = new DefaultInputPort<T>() {
    @Override
    public void process(T tuple) {
      emitTuple(key1, tuple);
    }
  };

  /**
   * An input port which receives incoming tuples; each tuple is emitted
   * under the classifier key {@code key2}.
   */
  public final transient DefaultInputPort<T> data2 = new DefaultInputPort<T>() {
    @Override
    public void process(T tuple) {
      emitTuple(key2, tuple);
    }
  };

  /**
   * An output port which emits modified tuples as a string of the form
   * {@code "<seed>:<key>,<tuple>"}.
   */
  public final transient DefaultOutputPort<String> string_data = new DefaultOutputPort<String>();

  /**
   * An output port which emits modified tuples as a hashmap: the outer key is
   * the seed rendered as a string, the inner map holds the single entry
   * {@code key -> tuple}.
   */
  public final transient DefaultOutputPort<HashMap<String, HashMap<String, T>>> hash_data =
      new DefaultOutputPort<HashMap<String, HashMap<String, T>>>();

  /**
   * Tags the tuple with the current seed and the given key, emits it on every
   * connected output port, then advances the seed.
   *
   * <p>The seed cycles through {@code s_start .. s_end - 1}: after each tuple it
   * is incremented, and once it reaches {@code s_end} it is reset to
   * {@code s_start}.
   *
   * @param key classifier key to attach to the tuple
   * @param tuple the incoming tuple
   */
  public void emitTuple(String key, T tuple) {
    if (string_data.isConnected()) {
      string_data.emit(seed + ":" + key + "," + tuple.toString());
    }
    if (hash_data.isConnected()) {
      HashMap<String, T> val = new HashMap<String, T>(1);
      val.put(key, tuple);
      HashMap<String, HashMap<String, T>> hdata = new HashMap<String, HashMap<String, T>>(1);
      hdata.put(Integer.toString(seed), val);
      hash_data.emit(hdata);
    }
    seed++;
    // ">=" rather than "==": with s_start == s_end an equality test is never
    // satisfied after the increment, and the seed would grow without bound.
    if (seed >= s_end) {
      seed = s_start;
    }
  }

  /**
   * Data for classification values. Not referenced by any other member of this class.
   */
  HashMap<String, Object> keys = new HashMap<String, Object>();

  /** Classifier key applied to tuples arriving on {@code data1}. */
  @NotNull
  String key1 = "";

  /** Classifier key applied to tuples arriving on {@code data2}. */
  @NotNull
  String key2 = "";

  /** First seed value of each cycle. */
  int s_start = 0;

  /** Bound at which the seed wraps back to {@code s_start}; never emitted itself. */
  int s_end = 99;

  /** Seed that will be attached to the next tuple. */
  int seed = 0;

  /**
   * @return the classifier key used for tuples from {@code data1}
   */
  @NotNull
  public String getKey1() {
    return key1;
  }

  /**
   * @return the classifier key used for tuples from {@code data2}
   */
  @NotNull
  public String getKey2() {
    return key2;
  }

  /**
   * Sets the value the seed starts from (and wraps back to).
   *
   * @param i seed start value
   */
  public void setSeedstart(int i) {
    s_start = i;
  }

  /**
   * Sets the bound at which the seed wraps around.
   *
   * @param i seed end value
   */
  public void setSeedend(int i) {
    s_end = i;
  }

  /**
   * Sets the classifier key used for tuples from {@code data1}.
   *
   * @param i the key
   */
  public void setKey1(String i) {
    key1 = i;
  }

  /**
   * Sets the classifier key used for tuples from {@code data2}.
   *
   * @param i the key
   */
  public void setKey2(String i) {
    key2 = i;
  }

  /**
   * Normalizes the seed range so that {@code s_start <= s_end} (swapping the
   * two values if they were configured in reverse) and positions the seed at
   * the start of the range.
   *
   * @param context operator context (not used here)
   */
  @Override
  public void setup(OperatorContext context) {
    if (s_start > s_end) {
      int temp = s_end;
      s_end = s_start;
      s_start = temp;
    }
    seed = s_start;
  }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy