All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.flink.table.runtime.join.stream.state.JoinKeyContainPrimaryKeyStateHandler Maven / Gradle / Ivy

There is a newer version: 1.5.1
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.flink.table.runtime.join.stream.state;

import org.apache.flink.annotation.Internal;
import org.apache.flink.api.java.functions.KeySelector;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.flink.api.java.tuple.Tuple3;
import org.apache.flink.runtime.state.keyed.KeyedValueState;
import org.apache.flink.table.dataformat.BaseRow;
import org.apache.flink.util.Preconditions;

import java.util.Collection;
import java.util.HashMap;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.NoSuchElementException;
import java.util.Set;

/**
 * The state whose keys are joinKeys, and the values are {@link Tuple3}.
 */
@Internal
public class JoinKeyContainPrimaryKeyStateHandler implements JoinStateHandler {

	private final KeyedValueState keyedValueState;

	private final KeySelector keySelector;

	private transient BaseRow joinKey;

	// memState is used for miniBatch join, we can batch get different join key's value and put
	// in memState which can be used later
	private Map memState;

	public JoinKeyContainPrimaryKeyStateHandler(
			KeyedValueState keyedValueState,
			KeySelector keySelector) {
		this.keySelector = keySelector;
		this.keyedValueState = keyedValueState;
		this.memState = new HashMap<>();
	}

	@Override
	public void extractCurrentJoinKey(BaseRow row) throws Exception {
		this.joinKey = keySelector.getKey(row);
	}

	@Override
	public BaseRow getCurrentJoinKey() {
		return this.joinKey;
	}

	@Override
	public void extractCurrentPrimaryKey(BaseRow row) {

	}

	@Override
	public BaseRow getCurrentPrimaryKey() {
		return null;
	}

	@Override
	public long add(BaseRow row, long expireTime) {
		keyedValueState.put(joinKey, row);
		return 1;
	}

	@Override
	public long retract(BaseRow row) {
		keyedValueState.remove(joinKey);
		return 0;
	}

	@Override
	public Iterator> getRecords(BaseRow key) {
		return new Tuple3Iterator(keyedValueState, key);
	}

	@Override
	public Iterator> getRecordsFromCache(BaseRow key) {
		return new Tuple3MemIterator(memState, key);
	}

	@Override
	public boolean contains(BaseRow key, BaseRow row) {
		return keyedValueState.contains(key);
	}

	@Override
	public void update(BaseRow key, BaseRow row, long count, long expireTime) {
		keyedValueState.put(key, row);
	}

	@Override
	public void remove(BaseRow joinKey) {
		keyedValueState.remove(joinKey);
	}

	// batch operators
	public void batchGet(Collection keys) {
		memState = keyedValueState.getAll(keys);
	}

	@Override
	public long[] batchUpdate(BaseRow key, List> rows, long expireTime) {
		// Note: value state batchUpdate will do nothing, we use putAll to batch update data. Because
		// every key contains only one rows for value state.

		long [] updateStatus = new long[rows.size()];
		int idx = 0;
		// Here we only care last value, can always set update status to 1 if f1 > 0. In this
		// way, we will always update match state, but we can avoid pre-read join state value.
		// Since write is faster than read, it is valuable to do it.
		Tuple2 lastTuple = null;
		for (Tuple2 tuple2: rows) {
			lastTuple = tuple2;
			idx++;
		}
		if (lastTuple != null) {
			if (lastTuple.f1 < 0) {
				updateStatus[rows.size() - 1] = -1;
			} else if (lastTuple.f1 > 0) {
				updateStatus[rows.size() - 1] = 1;
			}
		}
		return updateStatus;
	}

	@Override
	public void putAll(Map putMap) {
		keyedValueState.putAll(putMap);
	}

	@Override
	public void removeAll(Set keys) {
		keyedValueState.removeAll(keys);
	}

	@Override
	public void setCurrentJoinKey(BaseRow row) {
		joinKey = row;
	}

	/**
	 * An iterator over the elements under the same joinKey which is backed by an
	 * iterator in the internal state.
	 */
	private class Tuple3Iterator implements Iterator> {
		private final KeyedValueState keyedValueState;
		private final Tuple3 reuse;
		private final BaseRow key;
		private BaseRow curentValue;
		private int count;

		@SuppressWarnings("unchecked")
		Tuple3Iterator(KeyedValueState keyedValueState, BaseRow key) {
			Preconditions.checkNotNull(keyedValueState);
			this.keyedValueState = keyedValueState;
			this.key = key;
			this.reuse = new Tuple3<>();
		}

		@Override
		public boolean hasNext() {
			if (count == 0 && keyedValueState.get(key) != null) {
				return true;
			} else {
				return false;
			}
		}

		@SuppressWarnings("unchecked")
		@Override
		public Tuple3 next() {
			if (count == 0) {
				curentValue = keyedValueState.get(key);
				if (curentValue != null) {
					reuse.f0 = curentValue;
					reuse.f1 = 1L;
					reuse.f2 = Long.MAX_VALUE;
					count++;
					return reuse;
				}
			}
			throw new NoSuchElementException();
		}

		@Override
		public void remove() {
			keyedValueState.remove(key);
		}
	}

	private class Tuple3MemIterator implements Iterator> {

		private final Map keyedValueState;
		private final Tuple3 reuse;
		private final BaseRow key;
		private BaseRow curentValue;
		private int count;

		@SuppressWarnings("unchecked")
		Tuple3MemIterator(Map keyedValueState, BaseRow key) {
			Preconditions.checkNotNull(keyedValueState);
			this.keyedValueState = keyedValueState;
			this.key = key;
			this.reuse = new Tuple3<>();
		}

		@Override
		public boolean hasNext() {
			if (count == 0 && keyedValueState.get(key) != null) {
				return true;
			} else {
				return false;
			}
		}

		@SuppressWarnings("unchecked")
		@Override
		public Tuple3 next() {
			if (count == 0) {
				curentValue = keyedValueState.get(key);
				if (curentValue != null) {
					reuse.f0 = curentValue;
					reuse.f1 = 1L;
					reuse.f2 = Long.MAX_VALUE;
					count++;
					return reuse;
				}
			}
			throw new NoSuchElementException();
		}

		@Override
		public void remove() {
			keyedValueState.remove(key);
		}
	}
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy