org.biojava.nbio.aaproperties.Constraints Maven / Gradle / Ivy
/*
* BioJava development code
*
* This code may be freely distributed and modified under the
* terms of the GNU Lesser General Public Licence. This should
* be distributed with the code. If you do not have a copy,
* see:
*
* http://www.gnu.org/copyleft/lesser.html
*
* Copyright for this code is held jointly by the individual
* authors. These should be listed in @author doc comments.
*
* For more information on the BioJava project and its aims,
* or to join the biojava-l mailing list, visit the home page
* at:
*
* http://www.biojava.org/
*
*/
package org.biojava.nbio.aaproperties;
import org.biojava.nbio.aaproperties.PeptideProperties.SingleLetterAACode;
import org.biojava.nbio.core.sequence.compound.AminoAcidCompound;
import org.biojava.nbio.core.sequence.compound.AminoAcidCompoundSet;
import java.util.HashMap;
import java.util.Map;
/**
* This class is used to support the implementation of properties stated in IPeptideProperties.
* It initializes several values that would be needed for the computation of properties such as
*
* Molecular weight
* Instability index
* Hydropathy value
* pKa
*
* @author kohchuanhock
* @version 2011.05.21
* @see IPeptideProperties
*/
public class Constraints {
private static AminoAcidCompoundSet aaSet = new AminoAcidCompoundSet();
//A, R, N, D, C, E, Q, G, H, I, L, K, M, F, P, S, T, W, Y, V
public static AminoAcidCompound A = aaSet.getCompoundForString("A");
public static AminoAcidCompound R = aaSet.getCompoundForString("R");
public static AminoAcidCompound N = aaSet.getCompoundForString("N");
public static AminoAcidCompound D = aaSet.getCompoundForString("D");
public static AminoAcidCompound C = aaSet.getCompoundForString("C");
public static AminoAcidCompound E = aaSet.getCompoundForString("E");
public static AminoAcidCompound Q = aaSet.getCompoundForString("Q");
public static AminoAcidCompound G = aaSet.getCompoundForString("G");
public static AminoAcidCompound H = aaSet.getCompoundForString("H");
public static AminoAcidCompound I = aaSet.getCompoundForString("I");
public static AminoAcidCompound L = aaSet.getCompoundForString("L");
public static AminoAcidCompound K = aaSet.getCompoundForString("K");
public static AminoAcidCompound M = aaSet.getCompoundForString("M");
public static AminoAcidCompound F = aaSet.getCompoundForString("F");
public static AminoAcidCompound P = aaSet.getCompoundForString("P");
public static AminoAcidCompound S = aaSet.getCompoundForString("S");
public static AminoAcidCompound T = aaSet.getCompoundForString("T");
public static AminoAcidCompound W = aaSet.getCompoundForString("W");
public static AminoAcidCompound Y = aaSet.getCompoundForString("Y");
public static AminoAcidCompound V = aaSet.getCompoundForString("V");
public static Map aa2ExtinctionCoefficient = new HashMap();
public static Map aa2MolecularWeight = new HashMap();
public static Map aa2Hydrophathicity = new HashMap();
public static Map aa2PKa = new HashMap();
public static Map diAA2Instability = new HashMap();
public static Map aa2NTerminalPka = new HashMap();
public static Map aa2CTerminalPka = new HashMap();
static{
initMolecularWeight();
initHydropathicity();
initPKa();
initInstability();
initExtinctionCoefficient();
}
/**
* Does the initialization of molecular weights based on http://au.expasy.org/tools/findmod/findmod_masses.html#AA
*/
public static void initMolecularWeight(){
// Alanine (A) 71.03711 71.0788
aa2MolecularWeight.put(A, 71.0788);
// Arginine (R) 156.10111 156.1875
aa2MolecularWeight.put(R, 156.1875);
// Asparagine (N) 114.04293 114.1038
aa2MolecularWeight.put(N, 114.1038);
// Aspartic acid (D) 115.02694 115.0886
aa2MolecularWeight.put(D, 115.0886);
// Cysteine (C) 103.00919 103.1388
aa2MolecularWeight.put(C, 103.1388);
// Glutamic acid (E) 129.04259 129.1155
aa2MolecularWeight.put(E, 129.1155);
// Glutamine (Q) 128.05858 128.1307
aa2MolecularWeight.put(Q, 128.1307);
// Glycine (G) 57.02146 57.0519
aa2MolecularWeight.put(G, 57.0519);
// Histidine (H) 137.05891 137.1411
aa2MolecularWeight.put(H, 137.1411);
// Isoleucine (I) 113.08406 113.1594
aa2MolecularWeight.put(I, 113.1594);
// Leucine (L) 113.08406 113.1594
aa2MolecularWeight.put(L, 113.1594);
// Lysine (K) 128.09496 128.1741
aa2MolecularWeight.put(K, 128.1741);
// Methionine (M) 131.04049 131.1926
aa2MolecularWeight.put(M, 131.1926);
// Phenylalanine (F) 147.06841 147.1766
aa2MolecularWeight.put(F, 147.1766);
// Proline (P) 97.05276 97.1167
aa2MolecularWeight.put(P, 97.1167);
// Serine (S) 87.03203 87.0782
aa2MolecularWeight.put(S, 87.0782);
// Threonine (T) 101.04768 101.1051
aa2MolecularWeight.put(T, 101.1051);
// Tryptophan (W) 186.07931 186.2132
aa2MolecularWeight.put(W, 186.2132);
// Tyrosine (Y) 163.06333 163.1760
aa2MolecularWeight.put(Y, 163.1760);
// Valine (V) 99.06841 99.1326
aa2MolecularWeight.put(V, 99.1326);
}
/**
* Does the initialization of hydropathicity based on http://web.expasy.org/protscale/pscale/Hphob.Doolittle.html
*/
private static void initHydropathicity(){
// Ala(A): 1.800
aa2Hydrophathicity.put(A, 1.800);
// Arg(R): -4.500
aa2Hydrophathicity.put(R, -4.500);
// Asn(N): -3.500
aa2Hydrophathicity.put(N, -3.500);
// Asp(D): -3.500
aa2Hydrophathicity.put(D, -3.500);
// Cys(C): 2.500
aa2Hydrophathicity.put(C, 2.500);
// Gln(E): -3.500
aa2Hydrophathicity.put(E, -3.500);
// Glu(Q): -3.500
aa2Hydrophathicity.put(Q, -3.500);
// Gly(G): -0.400
aa2Hydrophathicity.put(G, -0.400);
// His(H): -3.200
aa2Hydrophathicity.put(H, -3.200);
// Ile(I): 4.500
aa2Hydrophathicity.put(I, 4.500);
// Leu(L): 3.800
aa2Hydrophathicity.put(L, 3.800);
// Lys(K): -3.900
aa2Hydrophathicity.put(K, -3.900);
// Met(M): 1.900
aa2Hydrophathicity.put(M, 1.900);
// Phe(F): 2.800
aa2Hydrophathicity.put(F, 2.800);
// Pro(P): -1.600
aa2Hydrophathicity.put(P, -1.600);
// Ser(S): -0.800
aa2Hydrophathicity.put(S, -0.800);
// Thr(T): -0.700
aa2Hydrophathicity.put(T, -0.700);
// Trp(W): -0.900
aa2Hydrophathicity.put(W, -0.900);
// Tyr(Y): -1.300
aa2Hydrophathicity.put(Y, -1.300);
// Val(V): 4.200
aa2Hydrophathicity.put(V, 4.200);
}
/**
* Does the initialization of PKa based on
* http://www.innovagen.se/custom-peptide-synthesis/peptide-property-calculator/peptide-property-calculator-notes.asp#NetCharge
*/
private static void initPKaInnovagen(){
/*
* A.Lehninger, Principles of Biochemistry, 4th Edition (2005), Chapter 3, page78, Table 3-1.
*/
//(NH2-) 9.69 (-COOH) 2.34
aa2CTerminalPka.put(G, 2.34);
aa2CTerminalPka.put(A, 2.34);
aa2CTerminalPka.put(P, 1.99);
aa2CTerminalPka.put(V, 2.32);
aa2CTerminalPka.put(L, 2.36);
aa2CTerminalPka.put(I, 2.36);
aa2CTerminalPka.put(M, 2.28);
aa2CTerminalPka.put(F, 1.83);
aa2CTerminalPka.put(Y, 2.20);
aa2CTerminalPka.put(W, 2.38);
aa2CTerminalPka.put(S, 2.21);
aa2CTerminalPka.put(T, 2.11);
aa2CTerminalPka.put(C, 1.96);
aa2CTerminalPka.put(N, 2.02);
aa2CTerminalPka.put(Q, 2.17);
aa2CTerminalPka.put(K, 2.18);
aa2CTerminalPka.put(H, 1.82);
aa2CTerminalPka.put(R, 2.17);
aa2CTerminalPka.put(D, 1.88);
aa2CTerminalPka.put(E, 2.19);
aa2NTerminalPka.put(G, 9.60);
aa2NTerminalPka.put(A, 9.69);
aa2NTerminalPka.put(P, 10.96);
aa2NTerminalPka.put(V, 9.62);
aa2NTerminalPka.put(L, 9.60);
aa2NTerminalPka.put(I, 9.68);
aa2NTerminalPka.put(M, 9.21);
aa2NTerminalPka.put(F, 9.13);
aa2NTerminalPka.put(Y, 9.11);
aa2NTerminalPka.put(W, 9.39);
aa2NTerminalPka.put(S, 9.15);
aa2NTerminalPka.put(T, 9.62);
aa2NTerminalPka.put(C, 10.28);
aa2NTerminalPka.put(N, 8.80);
aa2NTerminalPka.put(Q, 9.13);
aa2NTerminalPka.put(K, 8.95);
aa2NTerminalPka.put(H, 9.17);
aa2NTerminalPka.put(R, 9.04);
aa2NTerminalPka.put(D, 9.60);
aa2NTerminalPka.put(E, 9.67);
// K, Lys 10.53
aa2PKa.put(K, 10.53);
// D, Asp 3.65
aa2PKa.put(D, 3.65);
// R, Arg 12.48
aa2PKa.put(R, 12.48);
// E, Glu 4.25
aa2PKa.put(E, 4.25);
// H, His 6.00
aa2PKa.put(H, 6.00);
// C, Cys 8.18
aa2PKa.put(C, 8.18);
// Y, Tyr 10.07
aa2PKa.put(Y, 10.07);
}
private static void initPKa(){
initPKaInnovagen();
}
/**
* Does the initialization of dipeptide instability index based on the following paper
*
* Guruprasad, K., Reddy, B.V.B. and Pandit, M.W. (1990)
* Correlation between stability of a protein and its dipeptide composition: a novel approach for predicting in vivo stability of a protein from its primary sequence.
* Protein Eng. 4,155-161. Table III.
*/
private static void initInstability(){
double[][] instability = {
//W C M H Y F Q N I R D P T K E V S G A L
{1.0, 1.0, 24.68, 24.68, 1.0, 1.0, 1.0, 13.34, 1.0, 1.0, 1.0, 1.0, -14.03, 1.0, 1.0, -7.49, 1.0, -9.37, -14.03, 13.34},
{24.68, 1.0, 33.6, 33.6, 1.0, 1.0, -6.54, 1.0, 1.0, 1.0, 20.26, 20.26, 33.6, 1.0, 1.0, -6.54, 1.0, 1.0, 1.0, 20.26},
{1.0, 1.0, -1.88, 58.28, 24.68, 1.0, -6.54, 1.0, 1.0, -6.54, 1.0, 44.94, -1.88, 1.0, 1.0, 1.0, 44.94, 1.0, 13.34, 1.0},
{-1.88, 1.0, 1.0, 1.0, 44.94, -9.37, 1.0, 24.68, 44.94, 1.0, 1.0, -1.88, -6.54, 24.68, 1.0, 1.0, 1.0, -9.37, 1.0, 1.0},
{-9.37, 1.0, 44.94, 13.34, 13.34, 1.0, 1.0, 1.0, 1.0, -15.91, 24.68, 13.34, -7.49, 1.0, -6.54, 1.0, 1.0, -7.49, 24.68, 1.0},
{1.0, 1.0, 1.0, 1.0, 33.6, 1.0, 1.0, 1.0, 1.0, 1.0, 13.34, 20.26, 1.0, -14.03, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0},
{1.0, -6.54, 1.0, 1.0, -6.54, -6.54, 20.26, 1.0, 1.0, 1.0, 20.26, 20.26, 1.0, 1.0, 20.26, -6.54, 44.94, 1.0, 1.0, 1.0},
{-9.37, -1.88, 1.0, 1.0, 1.0, -14.03, -6.54, 1.0, 44.94, 1.0, 1.0, -1.88, -7.49, 24.68, 1.0, 1.0, 1.0, -14.03, 1.0, 1.0},
{1.0, 1.0, 1.0, 13.34, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, -1.88, 1.0, -7.49, 44.94, -7.49, 1.0, 1.0, 1.0, 20.26},
{58.28, 1.0, 1.0, 20.26, -6.54, 1.0, 20.26, 13.34, 1.0, 58.28, 1.0, 20.26, 1.0, 1.0, 1.0, 1.0, 44.94, -7.49, 1.0, 1.0},
{1.0, 1.0, 1.0, 1.0, 1.0, -6.54, 1.0, 1.0, 1.0, -6.54, 1.0, 1.0, -14.03, -7.49, 1.0, 1.0, 20.26, 1.0, 1.0, 1.0},
{-1.88, -6.54, -6.54, 1.0, 1.0, 20.26, 20.26, 1.0, 1.0, -6.54, -6.54, 20.26, 1.0, 1.0, 18.38, 20.26, 20.26, 1.0, 20.26, 1.0},
{-14.03,1.0, 1.0, 1.0, 1.0, 13.34, -6.54, -14.03, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 20.26, 1.0, 1.0, -7.49, 1.0, 1.0},
{1.0, 1.0, 33.6, 1.0, 1.0, 1.0, 24.68, 1.0, -7.49, 33.6, 1.0, -6.54, 1.0, 1.0, 1.0, -7.49, 1.0, -7.49, 1.0, -7.49},
{-14.03,44.94, 1.0, -6.54, 1.0, 1.0, 20.26, 1.0, 20.26, 1.0, 20.26, 20.26, 1.0, 1.0, 33.6, 1.0, 20.26, 1.0, 1.0, 1.0},
{1.0, 1.0, 1.0, 1.0, -6.54, 1.0, 1.0, 1.0, 1.0, 1.0, -14.03, 20.26, -7.49, -1.88, 1.0, 1.0, 1.0, -7.49, 1.0, 1.0},
{1.0, 33.6, 1.0, 1.0, 1.0, 1.0, 20.26, 1.0, 1.0, 20.26, 1.0, 44.94, 1.0, 1.0, 20.26, 1.0, 20.26, 1.0, 1.0, 1.0},
{13.34, 1.0, 1.0, 1.0, -7.49, 1.0, 1.0, -7.49, -7.49, 1.0, 1.0, 1.0, -7.49, -7.49, -6.54, 1.0, 1.0, 13.34, -7.49, 1.0},
{1.0, 44.94, 1.0, -7.49, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, -7.49, 20.26, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0},
{24.68, 1.0, 1.0, 1.0, 1.0, 1.0, 33.6, 1.0, 1.0, 20.26, 1.0, 20.26, 1.0, -7.49, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0}
};
SingleLetterAACode[] aa = SingleLetterAACode.values();
for(int i = 0; i < aa.length; i++){
for(int j = 0; j < aa.length; j++){
diAA2Instability.put("" + aa[i] + aa[j], instability[i][j]);
}
}
}
/**
* Does the initialization of extinction coefficient based on
* http://au.expasy.org/tools/protparam-doc.html
*/
public static void initExtinctionCoefficient(){
aa2ExtinctionCoefficient.put(Y, 1490.0);
aa2ExtinctionCoefficient.put(W, 5500.0);
aa2ExtinctionCoefficient.put(C, 125.0);
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy