All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.biojava.nbio.structure.basepairs.MismatchedBasePairParameters Maven / Gradle / Ivy

/*
 *                    BioJava development code
 *
 * This code may be freely distributed and modified under the
 * terms of the GNU Lesser General Public Licence.  This should
 * be distributed with the code.  If you do not have a copy,
 * see:
 *
 *      http://www.gnu.org/copyleft/lesser.html
 *
 * Copyright for this code is held jointly by the individual
 * authors.  These should be listed in @author doc comments.
 *
 * For more information on the BioJava project and its aims,
 * or to join the biojava-l mailing list, visit the home page
 * at:
 *
 *      http://www.biojava.org/
 *
 *
 */
package org.biojava.nbio.structure.basepairs;

import org.biojava.nbio.structure.Atom;
import org.biojava.nbio.structure.Chain;
import org.biojava.nbio.structure.Group;
import org.biojava.nbio.structure.Structure;
import org.biojava.nbio.structure.contact.Pair;

import javax.vecmath.Matrix4d;
import java.util.ArrayList;
import java.util.List;

/**
 * This class allows for finding inter-strand base pairs that are not necessarily canonical Watson-Crick pairs.
 * The implementation of findPair is different than that of the base class.  This class does not consider intra-strand
 * base pairing and for that, the TertiaryBasePairParameters class should be used.
 * @author Luke Czapla
 * @since 5.0.0
 *
 */
public class MismatchedBasePairParameters extends BasePairParameters {

	private static final long serialVersionUID = 2837124340169886674L;

	public static final double DEFAULT_MAX_STAGGER = 2.0;
	public static final double DEFAULT_MAX_PROPELLER = 60.0;
	public static final double DEFAULT_MAX_SHEAR = 5.0;
	public static final double DEFAULT_MAX_STRETCH = 5.0;

	// These are the criteria used to select proper base pairs.
	private double maxStagger = DEFAULT_MAX_STAGGER,
			maxShear = DEFAULT_MAX_SHEAR,
			maxStretch = DEFAULT_MAX_STRETCH,
			maxPropeller = DEFAULT_MAX_PROPELLER;

	/**
	 * This constructor is used to create the TertiaryBasePairParameters object.  The parent constructors are valid
	 * as well, but for this class, it makes the most sense to specify the exact parameters for the analysis.
	 * @param structure The Structure to analyze
	 * @param RNA Whether to analyze RNA (if false, it will analyze DNA)
	 * @param removeDups Whether to remove duplicate sequences (useful for RCSB data with redundant units).
	 * @param canonical Whether to only consider canonical Watson-Crick base pairs.  If false, any pairing will be identified
	 *                  as long it falls below the maximum values of stagger, shear, and stretch.
	 */
	public MismatchedBasePairParameters(Structure structure, boolean RNA, boolean removeDups, boolean canonical) {

		super(structure, RNA, removeDups, canonical);

	}

	/**
	 * This is an implementation for finding non-canonical base pairs when there may be missing or overhanging bases.
	 * @param chains The list of chains already found to be nucleic acids.
	 * @return The list of the atom groups (residues) that are pairs, as a Pair of nucleic acid Groups.
	 */
	@Override
	public List> findPairs(List chains) {
		List> result = new ArrayList<>();
		boolean lastFoundPair = false;
		for (int i = 0; i < chains.size(); i++) {
			Chain c = chains.get(i);
			String sequence = c.getAtomSequence();
			for (int m = 0; m < sequence.length(); m++) {
				boolean foundPair = false;
				Integer type1, type2;
				for (int j = i + 1; j < chains.size() && !foundPair; j++) {
					Chain c2 = chains.get(j);
					if (j > i+1 && c.getAtomSequence().equals(c2.getAtomSequence()) && nonredundant) continue;
					String sequence2 = c2.getAtomSequence();
					for (int k = c2.getAtomSequence().length() - 1; k >= 0 && !foundPair; k--) {
						if (canonical && !BasePairParameters.match(sequence.charAt(m), sequence2.charAt(k), useRNA)) continue;
						Group g1 = c.getAtomGroup(m);
						Group g2 = c2.getAtomGroup(k);
						type1 = BASE_MAP.get(g1.getPDBName());
						type2 = BASE_MAP.get(g2.getPDBName());
						if (type1 == null || type2 == null) continue;
						Atom a1 = g1.getAtom("C1'");
						Atom a2 = g2.getAtom("C1'");
						if (a1 == null || a2 == null) continue;
						// C1'-C1' distance is one useful criteria
						if (Math.abs(a1.getCoordsAsPoint3d().distance(a2.getCoordsAsPoint3d()) - 10.0) > 4.0) continue;
						Pair ga = new Pair<>(g1, g2);
						// TODO is this call needed?? JD 2018-03-07
						@SuppressWarnings("unused")
						Matrix4d data = basePairReferenceFrame(ga);
						// if the stagger is greater than 2 Å, it's not really paired.
						if (Math.abs(pairParameters[5]) > maxStagger) continue;
						// similarly, extreme shear and stretch is not a good base pair
						if (Math.abs(pairParameters[3]) > maxShear) continue;
						if (Math.abs(pairParameters[4]) > maxStretch) continue;

						// if the propeller is ridiculous it's also not that good of a pair.
						if (Math.abs(pairParameters[1]) > maxPropeller) {
							continue;
						}
						result.add(ga);
						pairingNames.add(useRNA ? BASE_LIST_RNA[type1] + BASE_LIST_RNA[type2] : BASE_LIST_DNA[type1] + BASE_LIST_DNA[type2]);
						foundPair = true;
					}
					if (!foundPair && lastFoundPair) {
						if (pairSequence.length() > 0 && pairSequence.charAt(pairSequence.length() - 1) != ' ')
							pairSequence += ' ';
					}
					if (foundPair) pairSequence += (c.getAtomSequence().charAt(i));
					lastFoundPair = foundPair;
				}
			}
		}
		return result;
	}

	/**
	 * This method returns the maximum stagger between bases used as criteria for the characterization of two bases as being paired.
	 * @return the maximum propeller ("propeller-twist", in degrees) allowed.
	 */
	public double getMaxStagger() {
		return maxStagger;
	}

	/**
	 * This method sets the maximum stagger allowed for a base pair, prior to analyze() call
	 * @param maxStagger The maximum propeller (in Å) allowed to consider two bases paired
	 */
	public void setMaxStagger(double maxStagger) {
		this.maxStagger = maxStagger;
	}

	/**
	 * This method returns the maximum shear between bases used as criteria for the characterization of two bases as being paired.
	 * @return the maximum shear (in Å) allowed.
	 */
	public double getMaxShear() {
		return maxShear;
	}

	/**
	 * This method sets the maximum shear allowed for a base pair, prior to analyze() call
	 * @param maxShear The maximum shear (in Å) allowed to consider two bases paired
	 */
	public void setMaxShear(double maxShear) {
		this.maxShear = maxShear;
	}

	/**
	 * This method returns the maximum stretch between bases used as criteria for the characterization of two bases as being paired.
	 * @return the maximum stretch (in Å) allowed.
	 */
	public double getMaxStretch() {
		return maxStretch;
	}

	/**
	 * This method sets the maximum stretch allowed for a base pair, prior to analyze() call.
	 * @param maxStretch The maximum stretch (in Å) allowed to consider two bases paired
	 */
	public void setMaxStretch(double maxStretch) {
		this.maxStretch = maxStretch;
	}

	/**
	 * This method returns the maximum propeller twist between bases used as criteria for the characterization of two bases as being paired.
	 * @return the maximum propeller ("propeller-twist", in degrees) allowed.
	 */
	public double getMaxPropeller() {
		return maxPropeller;
	}

	/**
	 * This method sets the maximum propeller allowed for a base pair, prior to analyze() call
	 * @param maxPropeller The maximum propeller ("propeller-twist", in degrees) allowed to consider two bases paired
	 */
	public void setMaxPropeller(double maxPropeller) {
		this.maxPropeller = maxPropeller;
	}
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy