All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.pharmgkb.parser.vcf.TransformingVcfLineParser Maven / Gradle / Ivy

package org.pharmgkb.parser.vcf;

import org.pharmgkb.parser.vcf.model.VcfMetadata;
import org.pharmgkb.parser.vcf.model.VcfPosition;
import org.pharmgkb.parser.vcf.model.VcfSample;

import javax.annotation.Nonnull;
import java.io.Closeable;
import java.io.IOException;
import java.io.PrintWriter;
import java.nio.file.Path;
import java.util.ArrayList;
import java.util.List;

/**
 * Applies a transformation to a VCF file.
 * This is a streaming {@link VcfLineParser} that applies a {@link VcfTransformation} and writes the VCF.
 * More generally, can apply to a single VCF stream a set of transformations and corresponding writers.
 * 

* Example: *

{@code
 *   VcfTransformation transformation1 = new VcfTransformation() {
 *       public void transformMetadata(VcfMetadata metadata) {
 *           metadata.getRawProperties().put("Test", "123"); // adds ##Test=123
 *       }
 *   };
 *   VcfTransformation transformation2 = new VcfTransformation() {
 *       public void transformDataLine(VcfMetadata metadata, VcfPosition position, List sampleData) {
 *           position.setQuality("0");
 *       }
 *   };
 *   TransformingVcfLineParser.Builder builder = new TransformingVcfLineParser.Builder();
 *   builder.addTransformation(transformation1, file1);
 *   builder.addTransformation(transformation2, file2);
 *   try (TransformingVcfLineParser lineParser = builder.build()) {
 *       try (VcfParser parser = new VcfParser.Builder().fromFile(input.toPath()).parseWith(transformer).build()) {
 *           parser.parse(); // prints transformed VCFs to file1 and file2
 *       }
 *   }
 * }
 * 
*/ public class TransformingVcfLineParser implements VcfLineParser, Closeable { private int m_lines; private List m_transformations; private List m_writers; private TransformingVcfLineParser(@Nonnull List transformations, @Nonnull List writer) { m_transformations = transformations; m_writers = writer; } public void parseLine(@Nonnull VcfMetadata metadata, @Nonnull VcfPosition position, @Nonnull List sampleData) { for (int i = 0; i < m_transformations.size(); i++) { // notice that this always happens before transformDataLine gets called // this means that transformDataLine can't change the metadata output if (m_lines == 0) { m_transformations.get(i).transformMetadata(metadata); m_writers.get(i).writeHeader(metadata); } boolean keep = m_transformations.get(i).transformDataLine(metadata, position, sampleData); if (keep) { m_writers.get(i).writeLine(metadata, position, sampleData); } } m_lines++; } @Override public void close() throws IOException { m_writers.forEach(org.pharmgkb.parser.vcf.VcfWriter::close); } public static class Builder { private List m_transformations = new ArrayList<>(); private List m_writers = new ArrayList<>(); @Nonnull public Builder addTransformation(@Nonnull VcfTransformation transformation, @Nonnull Path outputFile) throws IOException { m_transformations.add(transformation); m_writers.add(new VcfWriter.Builder().toFile(outputFile).build()); return this; } @Nonnull public Builder addTransformation(@Nonnull VcfTransformation transformation, @Nonnull PrintWriter writer) throws IOException { m_transformations.add(transformation); m_writers.add(new VcfWriter.Builder().toWriter(writer).build()); return this; } @Nonnull public Builder addTransformation(@Nonnull VcfTransformation transformation, @Nonnull VcfWriter writer) throws IOException { m_transformations.add(transformation); m_writers.add(writer); return this; } @Nonnull public TransformingVcfLineParser build() { if (m_transformations.isEmpty()) { throw new IllegalStateException("Must add at least one transformation"); } return new TransformingVcfLineParser(m_transformations, m_writers); } } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy