picard.sam.markduplicates.util.LibraryIdGenerator Maven / Gradle / Ivy
/*
* The MIT License
*
* Copyright (c) 2014 The Broad Institute
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to deal
* in the Software without restriction, including without limitation the rights
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
* THE SOFTWARE.
*/
package picard.sam.markduplicates.util;
import htsjdk.samtools.SAMFileHeader;
import htsjdk.samtools.SAMReadGroupRecord;
import htsjdk.samtools.SAMRecord;
import htsjdk.samtools.util.Histogram;
import picard.sam.DuplicationMetrics;
import java.util.HashMap;
import java.util.Map;
import java.util.Optional;
/**
* A class to generate library Ids and keep duplication metrics by library IDs.
*
* @author nhomer
*/
public class LibraryIdGenerator {
private static final String UNKNOWN_LIBRARY = "Unknown Library";
private final SAMFileHeader header;
private final Map libraryIds = new HashMap(); // from library string to library id
private short nextLibraryId = 1;
private final Map metricsByLibrary = new HashMap();
private final Histogram opticalDuplicatesByLibraryId = new Histogram();
public LibraryIdGenerator(final SAMFileHeader header) {
this.header = header;
for (final SAMReadGroupRecord readGroup : header.getReadGroups()) {
final String library = LibraryIdGenerator.getReadGroupLibraryName(readGroup);
DuplicationMetrics metrics = metricsByLibrary.get(library);
if (metrics == null) {
metrics = new DuplicationMetrics();
metrics.LIBRARY = library;
metricsByLibrary.put(library, metrics);
}
}
}
public Map getLibraryIdsMap() { return this.libraryIds; }
public Map getMetricsByLibraryMap() { return this.metricsByLibrary; }
public Histogram getOpticalDuplicatesByLibraryIdMap() { return this.opticalDuplicatesByLibraryId; }
public static String getReadGroupLibraryName(SAMReadGroupRecord readGroup) {
return Optional.ofNullable(readGroup.getLibrary())
.orElse(UNKNOWN_LIBRARY);
}
/**
* Gets the library name from the header for the record. If the RG tag is not present on
* the record, or the library isn't denoted on the read group, a constant string is
* returned.
*/
public static String getLibraryName(final SAMFileHeader header, final SAMRecord rec) {
final String readGroupId = (String) rec.getAttribute("RG");
if (readGroupId != null) {
final SAMReadGroupRecord rg = header.getReadGroup(readGroupId);
if (rg != null) {
final String libraryName = rg.getLibrary();
if (null != libraryName) return libraryName;
}
}
return UNKNOWN_LIBRARY;
}
/** Get the library ID for the given SAM record. */
public short getLibraryId(final SAMRecord rec) {
final String library = getLibraryName(this.header, rec);
Short libraryId = this.libraryIds.get(library);
if (libraryId == null) {
libraryId = this.nextLibraryId++;
this.libraryIds.put(library, libraryId);
}
return libraryId;
}
public DuplicationMetrics getMetricsByLibrary(final String library) {
return this.metricsByLibrary.get(library);
}
public void addMetricsByLibrary(final String library, final DuplicationMetrics metrics) {
this.metricsByLibrary.put(library, metrics);
}
public long getNumberOfOpticalDuplicateClusters() {
return (long) this.opticalDuplicatesByLibraryId.getSumOfValues();
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy