All downloads are free. Search and download functionality uses the official Maven repository.

com.davidbracewell.stream.JavaMPairStream Maven / Gradle / Ivy

There is a newer version: 0.5
Show newest version
/*
 * (c) 2005 David B. Bracewell
 *
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package com.davidbracewell.stream;

import com.davidbracewell.collection.Collect;
import com.davidbracewell.conversion.Cast;
import com.davidbracewell.function.*;
import com.davidbracewell.tuple.Tuple2;
import lombok.NonNull;

import java.io.Serializable;
import java.util.*;
import java.util.stream.Collectors;
import java.util.stream.Stream;

/**
 * An {@code MPairStream} implementation that wraps a {@link java.util.stream.Stream} of key/value entries and
 * implements every operation by delegating to that stream.
 *
 * <p>NOTE(review): the generic type arguments appear to have been stripped from this listing (e.g.
 * {@code Stream> stream}, {@code Cast::>as}); they must be restored from the original source before this file
 * will compile.</p>
 *
 * <p>NOTE(review): every method operates on the same wrapped stream field. A {@code java.util.stream.Stream} can
 * only be operated on once, so an instance presumably supports a single operation - confirm with callers.</p>
 *
 * <p>NOTE(review): the class is declared {@link Serializable} but its only instance field is a {@code Stream};
 * confirm whether Java serialization of instances is actually expected to work.</p>
 *
 * @author David B. Bracewell
 */
public class JavaMPairStream implements MPairStream, Serializable {
  private static final long serialVersionUID = 1L;

  /**
   * The wrapped stream of entries; elements are read through {@code getKey()} / {@code getValue()}.
   */
  private final Stream> stream;


  /**
   * Creates a pair stream over the entries of the given map.
   *
   * @param map the map whose entry set is streamed
   */
  public JavaMPairStream(Map map) {
    this(map.entrySet().stream());
  }

  /**
   * Creates a pair stream that wraps the given stream of entries.
   *
   * @param stream the stream to wrap; each element is passed through {@code Cast.as} (presumably an unchecked cast
   *               to the entry type of this class - confirm against {@code Cast})
   */
  public JavaMPairStream(Stream> stream) {
    this.stream = stream.map(Cast::as);
  }

  /**
   * Joins this stream with another pair stream on equal keys. For every entry of this stream and every value that
   * {@code other} holds under the same key, one tuple of the form {@code (key, (thisValue, otherValue))} is
   * emitted. Entries of this stream whose key does not occur in {@code other} produce no output.
   *
   * @param other the stream to join with; it is grouped by key and collected into a map before this stream is
   *              processed
   * @return a new pair stream of the joined tuples
   */
  @Override
  public  MPairStream> join(MPairStream other) {
    // Materialize the other side as key -> values so that each entry of this stream needs only a map lookup.
    Map> map = Cast.as(other.groupByKey().collectAsMap());
    return new JavaMPairStream<>(stream.flatMap(e -> {
      List>> list = new LinkedList<>();
      if (map.containsKey(e.getKey())) {
        // One output tuple per value stored under the matching key.
        map.get(e.getKey()).forEach(v -> list.add(Tuple2.of(e.getKey(), Tuple2.of(e.getValue(), v))));
      }
      // An empty list (no matching key) contributes nothing to the flattened result.
      return list.stream();
    }));
  }

  /**
   * Groups the entries by key and reduces the values of each group to a single value using the given operator.
   *
   * @param operator the operator used to combine the values of one key
   * @return a new pair stream of {@code (key, reducedValue)} tuples; the value is {@code null} when the reduction
   * yields an empty result ({@code orElse(null)})
   */
  @Override
  public MPairStream reduceByKey(SerializableBinaryOperator operator) {
    // Collect.from(u) presumably exposes the grouped values as a stream - confirm against Collect.
    return groupByKey().mapToPair((t, u) -> Tuple2.of(t, Collect.from(u).reduce(operator).orElse(null)));
  }


  /**
   * Closes the wrapped stream.
   *
   * @throws Exception declared by the signature; the body only calls {@code stream.close()}
   */
  @Override
  public void close() throws Exception {
    stream.close();
  }

  /**
   * Passes the key and value of every entry to the given consumer. A {@code null} entry is reported to the
   * consumer as {@code (null, null)}.
   *
   * @param consumer the consumer to invoke; annotated with Lombok's {@code @NonNull}
   */
  @Override
  public void forEach(@NonNull SerializableBiConsumer consumer) {
    stream.forEach(e -> {
      if (e == null) {
        consumer.accept(null, null);
      } else {
        consumer.accept(e.getKey(), e.getValue());
      }
    });
  }

  /**
   * Same as {@link #forEach} except that the wrapped stream is switched to sequential mode before iterating.
   * A {@code null} entry is reported to the consumer as {@code (null, null)}.
   *
   * <p>NOTE(review): unlike {@code forEach}, the parameter is not annotated {@code @NonNull} here - confirm
   * whether that difference is intentional.</p>
   *
   * @param consumer the consumer to invoke for each entry
   */
  @Override
  public void forEachLocal(SerializableBiConsumer consumer) {
    stream.sequential().forEach(e -> {
      if (e == null) {
        consumer.accept(null, null);
      } else {
        consumer.accept(e.getKey(), e.getValue());
      }
    });
  }

  /**
   * Applies the function to the key and value of every entry and returns the results as a {@code JavaMStream}.
   *
   * <p>Unlike {@link #forEach}, entries are dereferenced without a {@code null} check.</p>
   *
   * @param function the function applied to each key/value pair; annotated with Lombok's {@code @NonNull}
   * @return a new stream of the function results
   */
  @Override
  public  MStream map(@NonNull SerializableBiFunction function) {
    return new JavaMStream<>(stream.map(e -> function.apply(e.getKey(), e.getValue())));
  }

  /**
   * Groups the entries by key. The wrapped stream is fully collected with {@code Collectors.groupingBy} and the
   * resulting groups are re-streamed as {@code (key, list of values)} tuples.
   *
   * <p>NOTE(review): {@code Collectors.groupingBy} is documented to reject elements whose classifier result is
   * {@code null}, so entries with a {@code null} key presumably fail here - confirm.</p>
   *
   * @return a new pair stream with one entry per distinct key
   */
  @Override
  public MPairStream> groupByKey() {
    return new JavaMPairStream<>(
      stream.collect(Collectors.groupingBy(Map.Entry::getKey))
        .entrySet()
        .stream()
        // Each group holds whole entries; keep only their values.
        .map(e -> Tuple2.of(e.getKey(), e.getValue().stream().map(Map.Entry::getValue).collect(Collectors.toList())))
    );
  }

  /**
   * Maps every entry to a new entry by applying the function to its key and value.
   *
   * @param function the function producing the replacement entry for each key/value pair
   * @return a new pair stream of the produced entries (each result is passed through {@code Cast.as})
   */
  @Override
  public  MPairStream mapToPair(SerializableBiFunction> function) {
    return new JavaMPairStream<>(stream.map(entry -> Cast.as(function.apply(entry.getKey(), entry.getValue()))));
  }

  /**
   * Keeps only the entries whose key and value satisfy the predicate.
   *
   * @param predicate the test applied to each key/value pair
   * @return a new pair stream of the entries for which the predicate returned {@code true}
   */
  @Override
  public MPairStream filter(SerializableBiPredicate predicate) {
    return new JavaMPairStream<>(stream.filter(e -> predicate.test(e.getKey(), e.getValue())));
  }

  /**
   * Collects the entries into a {@link HashMap}. Entries are inserted with {@code put}, so when a key occurs more
   * than once only one of its values is retained.
   *
   * @return a new map containing the keys and values of this stream
   */
  @Override
  public Map collectAsMap() {
    // Three-argument collect: supplier, per-element accumulator, and combiner for merging partial maps.
    return stream.collect(HashMap::new, (map, e) -> map.put(e.getKey(), e.getValue()), HashMap::putAll);
  }

  /**
   * Keeps only the entries whose key satisfies the predicate.
   *
   * @param predicate the test applied to each key
   * @return a new pair stream of the entries for which the predicate returned {@code true}
   */
  @Override
  public MPairStream filterByKey(SerializablePredicate predicate) {
    return new JavaMPairStream<>(stream.filter(e -> predicate.test(e.getKey())));
  }

  /**
   * Keeps only the entries whose value satisfies the predicate.
   *
   * @param predicate the test applied to each value
   * @return a new pair stream of the entries for which the predicate returned {@code true}
   */
  @Override
  public MPairStream filterByValue(SerializablePredicate predicate) {
    return new JavaMPairStream<>(stream.filter(e -> predicate.test(e.getValue())));
  }


  /**
   * Collects the entries into a list using {@code Collectors.toList()}.
   *
   * @return a list of the entries of this stream
   */
  @Override
  public List> collectAsList() {
    return stream.map(Cast::>as).collect(Collectors.toList());
  }

  /**
   * Counts the entries of the wrapped stream.
   *
   * @return the number of entries
   */
  @Override
  public long count() {
    return stream.count();
  }

  /**
   * Returns the keys of the entries as a {@code JavaMStream}.
   *
   * @return a new stream containing the key of every entry
   */
  @Override
  public MStream keys() {
    return new JavaMStream<>(stream.map(Map.Entry::getKey));
  }

  /**
   * Sorts the entries by applying the comparator to their keys; values do not take part in the comparison.
   *
   * @param comparator the comparator used to order the keys
   * @return a new pair stream over the sorted entries
   */
  @Override
  public MPairStream sortByKey(SerializableComparator comparator) {
    return new JavaMPairStream<>(stream.sorted((o1, o2) -> comparator.compare(o1.getKey(), o2.getKey())));
  }

  /**
   * Combines this stream with another pair stream.
   *
   * <p>When {@code other} is a {@code SparkPairStream} the call is delegated to {@code other.union(this)}.
   * Otherwise the entries of this stream are concatenated with those of {@code other}.</p>
   *
   * <p>NOTE(review): the non-Spark branch casts {@code other} to this class to read its private {@code stream}
   * field, so it presumably only works when {@code other} is a {@code JavaMPairStream} - confirm.</p>
   *
   * @param other the stream to combine with
   * @return a pair stream containing the entries of both streams
   */
  @Override
  public MPairStream union(MPairStream other) {
    if (other instanceof SparkPairStream) {
      return Cast.as(other.union(Cast.as(this)));
    }
    return new JavaMPairStream<>(Stream.concat(stream, Cast.>as(other).stream));
  }

  /**
   * Returns the values of the entries as a {@code JavaMStream}.
   *
   * @return a new stream containing the value of every entry
   */
  @Override
  public MStream values() {
    return new JavaMStream<>(stream.map(Map.Entry::getValue));
  }

  /**
   * Returns a pair stream wrapping the parallel version of the underlying stream.
   *
   * @return a new pair stream over {@code stream.parallel()}
   */
  @Override
  public MPairStream parallel() {
    return new JavaMPairStream<>(stream.parallel());
  }

  /**
   * Reorders the entries randomly: each entry is paired with a value drawn from {@code random.nextDouble()},
   * the pairs are sorted by that value, and the random value is then discarded.
   *
   * @param random the source of the random sort keys
   * @return a new pair stream over the reordered entries
   */
  @Override
  public MPairStream shuffle(Random random) {
    return new JavaMPairStream<>(
      stream.map(t -> Tuple2.of(random.nextDouble(), t))
        .sorted(Map.Entry.comparingByKey())
        .map(Tuple2::getValue)
    );
  }
}//END OF JavaMPairStream