com.github.heuermh.adam.plugins.JavaCountAlignmentsPerRead Maven / Gradle / Ivy
/**
* Copyright 2014 held jointly by the individual authors.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.github.heuermh.adam.plugins;
import java.io.Serializable;
import org.apache.avro.Schema;
import org.apache.spark.SparkContext;
import org.apache.spark.rdd.RDD;
import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.function.Function;
import org.apache.spark.api.java.function.Function2;
import org.apache.spark.api.java.function.PairFunction;
import org.bdgenomics.adam.apis.java.JavaADAMContext;
import org.bdgenomics.adam.plugins.ADAMPlugin;
import org.bdgenomics.formats.avro.AlignmentRecord;
import scala.Function1;
import scala.Option;
import scala.Tuple2;
/**
* Count alignments per read implemented in Java.
*
* @author Michael Heuer
*/
public final class JavaCountAlignmentsPerRead extends JavaADAMPlugin> implements Serializable {
@Override
public JavaRDD> run(final JavaADAMContext ac, final JavaRDD recs, final String args) {
JavaRDD contigNames = recs.map(new Function() {
@Override
public CharSequence call(final AlignmentRecord rec) {
return rec.getReadMapped() ? rec.getReadName() : "unmapped";
}
});
JavaPairRDD counts = contigNames.mapToPair(new PairFunction() {
@Override
public Tuple2 call(final CharSequence readName) {
return new Tuple2(readName, Integer.valueOf(1));
}
});
JavaPairRDD reducedCounts = counts.reduceByKey(new Function2() {
@Override
public Integer call(final Integer value0, final Integer value1) {
return Integer.valueOf(value0.intValue() + value1.intValue());
}
});
// todo: seems like there should be a more direct way
return JavaRDD.fromRDD(reducedCounts.rdd(), null);
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy