All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.actelion.research.chem.SSSearcher Maven / Gradle / Ivy

There is a newer version: 2024.12.1
Show newest version
/*
* Copyright (c) 1997 - 2016
* Actelion Pharmaceuticals Ltd.
* Gewerbestrasse 16
* CH-4123 Allschwil, Switzerland
*
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are met:
*
* 1. Redistributions of source code must retain the above copyright notice, this
*    list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright notice,
*    this list of conditions and the following disclaimer in the documentation
*    and/or other materials provided with the distribution.
* 3. Neither the name of the the copyright holder nor the
*    names of its contributors may be used to endorse or promote products
*    derived from this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
* DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
* ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
*/

package com.actelion.research.chem;

import com.actelion.research.util.IntArrayComparator;

import java.util.*;

public class SSSearcher {
	// CONSTANTS TO DEFINE KIND OF SIMILARITY BETWEEN ATOMS AND BONDS
	// Each constant has a distinct single-bit value (1, 2, 4, 8), so several of them
	// can be combined into one match mode value, as accepted by SSSearcher(int matchMode)
	// and by the matchMode parameter of the search methods.
	public final static int cMatchAtomCharge = 1;
	public final static int cMatchAtomMass = 2;
	public final static int cMatchDBondToDelocalized = 4;
	public final static int cMatchAromDBondToDelocalized = 8;

/*	For index match modes we need to consider the following:
  - If fragment C is SS of fragment B and B is SS of molecule A then C must be SS of A.
	This implies that if X is SS of Y then X is in all respects equally or less exactly
	defined than Y. Consequently, if the SS operator matches any double bonds to aromatic
	double bonds and matches aromatic double bonds to delocalized bonds, it must match
	any double bond to delocalized bonds (cMatchAromDBondToDelocalized cannot be used for
	index creation). Example: key C=C-N-C=C, query pyrrole, molecule indole, key would match
	pyrrole but not indole!!!
  - match modes used for the actual atom by atom check must be more or equally restrictive
	than the match mode used for index creation. Otherwise index keys may filter out
	molecules which would be considered a match with the less strict matching conditions
	of the atom by atom check.
*/

									// match mode to be used for index creation
	public static final int cIndexMatchMode = cMatchDBondToDelocalized;
									// match mode assigned by the no-argument constructor
	public static final int cDefaultMatchMode = cMatchAromDBondToDelocalized;

	// Count modes accepted as countMode by findFragmentInMolecule(countMode, matchMode, ...):
	// - cCountModeExistance is the mode used by isFragmentInMolecule(); no retrievable
	//   match list is created in this mode
	// - cCountModeOverlapping is the mode used by the parameterless findFragmentInMolecule()
	// - for cCountModeFirstMatch, cCountModeOverlapping and cCountModeRigorous the counted
	//   matches can be retrieved afterwards with getMatchList()
	// NOTE(review): how cCountModeSeparated is handled is not visible in this part of the
	// file -- confirm against findFragmentInMolecule() before relying on it.
	public final static int cCountModeExistance		= 1;
	public final static int cCountModeFirstMatch	= 2;
	public final static int cCountModeSeparated		= 3;
	public final static int cCountModeOverlapping	= 4;
	public final static int cCountModeRigorous		= 5;

	// default behaviour for unusual atom masses and atom charges is that
	// - if no atom charge/mass is specified in the query then all charges/masses match
	// - if an atom charge/mass is specified then this charge/mass must match for the atom to match

	// defines details of similarity between atoms and bonds; assigned in the constructors
	// and used by those search methods that don't take an explicit matchMode argument
	private int mDefaultMatchMode;

	// The molecule which is analyzed
	// (null after setMolecule() was called with null or with a molecule without atoms)
	protected StereoMolecule mMolecule;

	// The sub-structure we try to find in the molecule
	// (null after setFragment() was called with null, with a molecule without atoms,
	// or with a molecule for which isFragment() returns false)
	protected StereoMolecule mFragment;

	private int[] mMoleculeAtomType;	// atom features required to match
	private int[] mFragmentAtomType;
	private int[] mMoleculeAtomFeatures;	// flags defining given/required atom features
	private int[] mFragmentAtomFeatures;
	private int[] mMoleculeBondFeatures;	// flags defining given/required bond features
	private int[] mFragmentBondFeatures;

	// counts that findFragmentInMolecule() subtracts from the fragment's atom and bond
	// counts before comparing them with the molecule's atom and bond counts
	private int mFragmentExcludeAtoms,mFragmentExcludeBonds;
	private int mFragmentGraphSize;	// the number of wanted atoms & ring closures in fragment graph
	private int mFragmentGraphSizeWithExcludeGroups;	// total number of atoms & ring closures in fragment graph

	// The fragment graph: parallel arrays indexed by graph position. tryAddCandidate() fills
	// them with the fragment atom at that position, the fragment atom it was attached from,
	// the connecting fragment bond, and whether the position revisits an already used atom.
	private int[] mFragmentGraphAtom;
	private int[] mFragmentGraphParentAtom;
	private int[] mFragmentGraphParentBond;
	private boolean[] mFragmentGraphIsRingClosure;
	private boolean[] mIsExcludeAtom;	// indexed by fragment atom
	private int[] mFragmentConnAtoms;	// in case of exclude atoms, these are not part of this
	private int[] mMatchTable;	// indexed by fragment atom: the molecule atom currently matched to it
	private int[] mExcludeGroupNo;	// indexed by fragment atom
	private int[] mExcludeGroupGraphIndex;	// indexed by exclude group no: first graph position of that group

	// depending on the fragment count mode this may contain atom lists
	// of all till now located matching sub-fragments
	// Element types are declared explicitly rather than using raw collections:
	// matches are int[] atom mappings (the sorted set is ordered by an IntArrayComparator),
	// and doBridgeBondsMatch() iterates mBridgeBondList as BridgeBond objects.
	private TreeSet<int[]> mSortedMatchSet;
	private ArrayList<int[]> mMatchList;
	private ArrayList<BridgeBond> mBridgeBondList;

	private boolean mMoleculeFeaturesValid;	// set to false whenever setMolecule() accepts a new molecule
	private boolean mFragmentFeaturesValid;	// set to false whenever setFragment() accepts a new fragment
	private int mRequiredHelperLevel;
	private int mExcludeGroupCount;

	/**
	 * Creates a SSSearcher that uses cDefaultMatchMode as its default match mode.
	 * A SSSearcher runs sub-structure searches with one or more sub-structure
	 * fragments on one or more molecules using a pure graph matching algorithm.
	 * For fast sub-structure searches involving an index based pre-screening use the class SSSearcherWithIndex.
	 * For a more high-level structure search supporting multiple cores, sub-structure-, similarity-,
	 * exact-, or tautomer-search use class StructureSearch and related classes.
	 */
	public SSSearcher() {
		// same initialization as SSSearcher(int), just with the default match mode
		this(cDefaultMatchMode);
		}


	/**
	 * Instantiates a SSSearcher object for running sub-structure searches
	 * with one or more sub-structure fragments on one or more molecules.
	 * The search is a pure graph matching algorithm.
	 * For fast sub-structure searches involving an index based pre-screening use the class SSSearcherWithIndex.
	 * For a more high-level structure search supporting multiple cores, sub-structure-, similarity-,
	 * exact-, or tautomer-search use class StructureSearch and related classes.
	 * @param matchMode combination of cMatchAtomCharge, cMatchAtomMass, cMatchDBondToDelocalized, cMatchAromDBondToDelocalized;
	 *                  becomes the match mode of those search methods that don't take an explicit matchMode
	 */
	public SSSearcher(int matchMode) {
		mDefaultMatchMode = matchMode;
		// explicit element types instead of raw collections: every match is an int[] atom mapping
		mMatchList = new ArrayList<int[]>();
		mSortedMatchSet = new TreeSet<int[]>(new IntArrayComparator());
		}


	/**
	 * Defines fragment and molecule before calling isFragmentInMolecule(...)
	 * or findFragmentInMolecule(...).
	 * This is a convenience method that calls setMolecule(molecule) followed by
	 * setFragment(fragment); the null/empty handling of these two methods applies.
	 * @param fragment the sub-structure to search for; passed on to setFragment()
	 * @param molecule the molecule to search in; passed on to setMolecule()
	 */
	public void setMol(StereoMolecule fragment, StereoMolecule molecule) {
		setMolecule(molecule);
		setFragment(fragment);
		}


	/**
	 * Sets the molecule that subsequent calls of isFragmentInMolecule(...)
	 * or findFragmentInMolecule(...) operate on.
	 * If null or a molecule without any atoms is passed, the searcher's molecule is
	 * reset to null. Otherwise the molecule is stored, its features are flagged as
	 * not valid, and its helper arrays are ensured for level Molecule.cHelperNeighbours.
	 * @param molecule the molecule to search in; may be null
	 */
	public void setMolecule(StereoMolecule molecule) {
		boolean hasAtoms = (molecule != null && molecule.getAllAtoms() != 0);

		if (hasAtoms) {
			mMoleculeFeaturesValid = false;
			mMolecule = molecule;
			molecule.ensureHelperArrays(Molecule.cHelperNeighbours);
			}
		else {
			mMolecule = null;
			}
		}


	/**
	 * Defines the fragment to be used in isFragmentInMolecule(...)
	 * or findFragmentInMolecule(...).
	 * @param fragment
	 */
	public void setFragment(StereoMolecule fragment) {
		if (fragment == null || fragment.getAllAtoms() == 0 || !fragment.isFragment()) {
			mFragment = null;
			return;
			}

		mFragment = fragment;
		mFragmentFeaturesValid = false;
		mFragment.ensureHelperArrays(Molecule.cHelperNeighbours);

		mRequiredHelperLevel = Molecule.cHelperRings;
		for (int atom=0; atom
	 * - it is not equal to the parent of the current graph atom and
* - if the bond to the candidate is not a bridge bond
* - if the bond was not added to the graph already
* then attach the candidate to the graph and mark, whether it is a ring closure (and therefore duplicate). * @param current * @param highest * @param i connAtom index of current graph atom * @param fragmentAtomUsed * @param fragmentBondUsed * @return */ private int tryAddCandidate(int current, int highest, int i, boolean[] fragmentAtomUsed, boolean[] fragmentBondUsed, int excludeGroupNo) { int candidate = mFragment.getConnAtom(mFragmentGraphAtom[current], i); if ((!mIsExcludeAtom[candidate] || mExcludeGroupNo[candidate] == excludeGroupNo) // always allow non-exclude atoms, because it may be a ring closure from exclude group to main fragment && candidate != mFragmentGraphParentAtom[current]) { int candidateBond = mFragment.getConnBond(mFragmentGraphAtom[current], i); if (!fragmentBondUsed[candidateBond] // if it is a ring closure make sure it is added only once && !mFragment.isBondBridge(candidateBond)) { // don't consider bridge bonds at this state mFragmentGraphAtom[++highest] = candidate; mFragmentGraphParentAtom[highest] = mFragmentGraphAtom[current]; mFragmentGraphParentBond[highest] = candidateBond; fragmentBondUsed[candidateBond] = true; if (fragmentAtomUsed[candidate]) mFragmentGraphIsRingClosure[highest] = true; else fragmentAtomUsed[candidate] = true; } } return highest; } /** * If the match count mode is one of cCountModeFirstMatch, cCountModeOverlapping, * cCountModeRigorous then this method returns an arraylist of all counted matches, * i.e. int arrays mapping fragment atoms to molecule atoms. Atoms being part of a * matched bridge bond are naturally not covered by the mapping.
* Note: If some query fragment atoms are marked as exclude group, then the respective * matchlist values are -1. * @return list of distinct counted matches. */ public ArrayList getMatchList() { return mMatchList; } /** * Fastest check, whether the molecule contains the fragment. * This method uses cCountModeExistance and therefore does not create * any retrievable match list, i.e. mapping from fragment atoms to molecule atoms. * The match mode used is cDefaultMatchMode, unless defined otherwise when * instantiating the SSSearcher. * @return whether fragment was found as sub-structure in molecule */ public boolean isFragmentInMolecule() { return (findFragmentInMolecule(cCountModeExistance, mDefaultMatchMode) > 0); } /** * Fastest check, whether the molecule contains the fragment. * This method uses cCountModeExistance and therefore does not create * any retrievable match list, i.e. mapping from fragment atoms to molecule atoms. * @param matchMode cDefaultMatchMode or combination of cMatchAtomCharge, cMatchAtomMass, cMatchDBondToDelocalized, cMatchAromDBondToDelocalized * @return whether fragment was found as sub-structure in molecule */ public boolean isFragmentInMolecule(int matchMode) { return (findFragmentInMolecule(cCountModeExistance, matchMode) > 0); } /** * Locates all matches of the fragment in the molecule that result in distinguishable * sets of molecule atoms. Multiple matches involving the same atoms, e.g. with a benzene ring, * are counted and listed only once. Atom mapping from fragment to molecule * is collected and can be retrieved with getMatchList(). * @return count of sub-structure matches of fragment in molecule */ public int findFragmentInMolecule() { return findFragmentInMolecule(cCountModeOverlapping, mDefaultMatchMode); } /** * Locates all matches of the fragment in the molecule that result in distinguishable * sets of molecule atoms. Multiple matches involving the same atoms, e.g. with a benzene ring, * are counted and listed only once. 
If count mode is different from cCountModeExistance, * then an atom mapping from fragment to molecule is collected and can be retrieved with getMatchList(). * @param countMode one of cCountModeExistance, cCountModeFirstMatch, cCountModeOverlapping, cCountModeRigorous * @param matchMode cDefaultMatchMode or combination of cMatchAtomCharge, cMatchAtomMass, cMatchDBondToDelocalized, cMatchAromDBondToDelocalized * @return count of sub-structure matches of fragment in molecule */ public int findFragmentInMolecule(int countMode, int matchMode) { return findFragmentInMolecule(countMode, matchMode, null); } /** * Locates all matches of the fragment in the molecule that result in distinguishable * sets of molecule atoms that are not flagged to be excluded from matching. * Multiple matches involving the same atoms, e.g. with a benzene ring, * are counted and listed only once. If count mode is different from cCountModeExistance, * then an atom mapping from fragment to molecule is collected and can be retrieved with getMatchList(). * If the query fragment does not contain atoms other than exclude group atoms, then no match is returned. 
* @param countMode one of cCountModeExistance, cCountModeFirstMatch, cCountModeOverlapping, cCountModeRigorous * @param matchMode cDefaultMatchMode or combination of cMatchAtomCharge, cMatchAtomMass, cMatchDBondToDelocalized, cMatchAromDBondToDelocalized * @param atomExcluded defines atoms of molecule to be excluded from sub-structure matching * @return count of sub-structure matches of fragment in molecule */ public int findFragmentInMolecule(int countMode, int matchMode, final boolean[] atomExcluded) { mMatchList = new ArrayList(); mSortedMatchSet.clear(); if (mMolecule == null || mFragment == null) return 0; if (mFragment.getAtoms() - mFragmentExcludeAtoms > mMolecule.getAtoms() || mFragment.getBonds() - mFragmentExcludeBonds > mMolecule.getBonds()) return 0; if (mFragment.getAtoms() == 0) return 0; /* System.out.print(" molecule:"); for (int i=0; i= mMolecule.getAtoms()) continue; int candidate = mMolecule.getConnAtom(mMatchTable[mFragmentGraphParentAtom[current]], index[current]); if (!mFragmentGraphIsRingClosure[current]) { // current graph position is not an anchor if (!atomUsed[candidate]) { if (areAtomsSimilar(candidate, mFragmentGraphAtom[current]) && areBondsSimilar(mMolecule.getConnBond(mMatchTable[mFragmentGraphParentAtom[current]], index[current]), mFragmentGraphParentBond[current])) { atomUsed[candidate] = true; mMatchTable[mFragmentGraphAtom[current]] = candidate; current++; } } } else { // current graph position is ringClosure if (candidate == mMatchTable[mFragmentGraphAtom[current]] && areBondsSimilar(mMolecule.getConnBond(mMatchTable[mFragmentGraphParentAtom[current]], index[current]), mFragmentGraphParentBond[current])) { current++; } } } } if (current == mFragmentGraphSize) { if (doTHParitiesMatch(-1) && doEZParitiesMatch(-1) && doBridgeBondsMatch(atomUsed, -1)) { // we currently have a match not considering exclude groups boolean isExcludedMatch = false; for (int excludeGroup=0; excludeGroup moleculeConnAtoms) return false; int moleculeQF = 
mMolecule.getAtomQueryFeatures(moleculeAtom); int fragmentQF = mFragment.getAtomQueryFeatures(fragmentAtom); int[] fragmentList = mFragment.getAtomList(fragmentAtom); int[] moleculeList = mMolecule.getAtomList(moleculeAtom); // check atomicNo's considering all 16 combinations of: Any set or not, atom list given or not if ((fragmentQF & Molecule.cAtomQFAny) != 0) { if (fragmentList != null) { if ((moleculeQF & Molecule.cAtomQFAny) != 0) { if (moleculeList == null) return false; if (!isSubListOf(fragmentList, moleculeList)) return false; } else { if (moleculeList != null) { if (listsOverlap(moleculeList, fragmentList)) return false; } else { if (isListMember(mMolecule.getAtomicNo(moleculeAtom), fragmentList)) return false; } } } } // 4 cases with Any set in fragment but no fragment exclude list given don't need to be checked else { // cAtomQFAny not set in fragment but Any set in molecule if ((moleculeQF & Molecule.cAtomQFAny) != 0) return false; // regardless of possibly given lists these 4 cases cannot match // remaining cases: Any neither set in fragment nor molecule, but check for lists if (fragmentList != null) { if (moleculeList != null) { if (!isSubListOf(moleculeList, fragmentList)) return false; } else { if (!isListMember(mMolecule.getAtomicNo(moleculeAtom), fragmentList)) return false; } } else { if (moleculeList != null) return false; if (mMoleculeAtomType[moleculeAtom] != mFragmentAtomType[fragmentAtom]) return false; } } // end atomicNo, cAtomQFAny and AtomList checking if ((moleculeQF | fragmentQF) != 0) { if ((fragmentQF & Molecule.cAtomQFNoMoreNeighbours) != 0) { if (mMolecule.isFragment() && (moleculeQF & Molecule.cAtomQFNoMoreNeighbours) == 0) return false; else if (fragmentConnAtoms != moleculeConnAtoms) return false; } if ((fragmentQF & Molecule.cAtomQFMoreNeighbours) != 0) { if ((fragmentConnAtoms >= moleculeConnAtoms) && (moleculeQF & Molecule.cAtomQFMoreNeighbours) == 0) return false; } } if ((mMoleculeAtomFeatures[moleculeAtom] & 
~mFragmentAtomFeatures[fragmentAtom]) != 0) return false; if (mFragment.getAtomCharge(fragmentAtom) != 0 && mFragment.getAtomCharge(fragmentAtom) != mMolecule.getAtomCharge(moleculeAtom)) return false; if (mFragment.getAtomMass(fragmentAtom) != 0 && mFragment.getAtomMass(fragmentAtom) != mMolecule.getAtomMass(moleculeAtom)) return false; int ringSize = (mFragment.getAtomQueryFeatures(fragmentAtom) & Molecule.cAtomQFRingSize) >> Molecule.cAtomQFRingSizeShift; if (ringSize != 0) { if (mMolecule.isFragment() && ringSize == (mMolecule.getAtomQueryFeatures(fragmentAtom) & Molecule.cAtomQFRingSize) >> Molecule.cAtomQFRingSizeShift) return true; boolean found = false; RingCollection ringSet = mMolecule.getRingSet(); for (int i=0; i mMatchTable[connAtom2]) ^ (connAtom1 > connAtom2)) inversion = !inversion; } } } else { // allene parities for (int i=0; i mMatchTable[neighbour[1]]) ^(neighbour[0] > neighbour[1]))) inversion = !inversion; } } return inversion; } /** * Check whether all double bond parities required to match are compatible * with a match. 
* @return true if all E/Z parities match */ private boolean doEZParitiesMatch(int excludeGroupNo) { for (int fragmentBond=0; fragmentBond atom) relevantAtom[i] = atom; } } int memberCount = 0; if (ringSet.isAtomMember(r, relevantAtom[0])) memberCount++; if (ringSet.isAtomMember(r, relevantAtom[1])) memberCount++; if (memberCount == 2) return Molecule.cBondCIPParityZorM; if (memberCount == 1) return Molecule.cBondCIPParityEorP; return Molecule.cBondCIPParityZorM; } } return Molecule.cBondCIPParityNone; } // private boolean isEZParityInversion(int fragmentBond, int moleculeBond) { // boolean inversion = false; // for (int i=0; i<2; i++) { // int fragmentAtom = mFragment.getBondAtom(i, fragmentBond); // int moleculeAtom = mMatchTable[fragmentAtom]; // if (mFragment.getConnAtoms(fragmentAtom) == 2) { // if (mMolecule.getConnAtoms(moleculeAtom) == 2) // continue; // // int fragmentNeighbour = -1; // for (int j=0; j<2; j++) // if (mFragment.getConnBond(fragmentAtom, j) != fragmentBond) // fragmentNeighbour = mFragment.getConnAtom(fragmentAtom, j); // // int moleculeNeighbours = 0; // int[] moleculeNeighbour = new int[2]; // for (int j=0; j<3; j++) // if (mMolecule.getConnBond(moleculeAtom, j) != moleculeBond) // moleculeNeighbour[moleculeNeighbours++] = mMolecule.getConnAtom(moleculeAtom, j); // // if (mMatchTable[fragmentNeighbour] != moleculeNeighbour[0]) // inversion = !inversion; // } // else if (mFragment.getConnAtoms(fragmentAtom) == 3 // && mMolecule.getConnAtoms(moleculeAtom) == 3) { // int[] fragmentNeighbour = new int[2]; // int fragmentNeighbours = 0; // for (int j=0; j<3; j++) // if (mFragment.getConnBond(fragmentAtom, j) != fragmentBond) // fragmentNeighbour[fragmentNeighbours++] = mFragment.getConnAtom(fragmentAtom, j); // if ((mMatchTable[fragmentNeighbour[0]] > mMatchTable[fragmentNeighbour[1]]) // ^ (fragmentNeighbour[0] > fragmentNeighbour[1])) // inversion = !inversion; // } // } // return inversion; // } private boolean isEZParityInversion(int 
fragmentBond, int moleculeBond) { boolean inversion = false; for (int i=0; i<2; i++) { int fragmentAtom = mFragment.getBondAtom(i, fragmentBond); int moleculeAtom = mMatchTable[fragmentAtom]; if (mMolecule.getConnAtoms(moleculeAtom) > 2) { int otherFragmentAtom = mFragment.getBondAtom(1-i, fragmentBond); int lowFragmentNeighbour = Integer.MAX_VALUE; for (int j=0; j fragmentNeighbour) lowFragmentNeighbour = fragmentNeighbour; } int otherMoleculeAtom = mMatchTable[otherFragmentAtom]; int lowMoleculeNeighbour = Integer.MAX_VALUE; for (int j=0; j moleculeNeighbour) lowMoleculeNeighbour = moleculeNeighbour; } if (mMatchTable[lowFragmentNeighbour] != lowMoleculeNeighbour) inversion = !inversion; } } return inversion; } /** * Starting from a full match of the fragment without exclude groups, this method continues * the graph matching to find, whether the specified exclude group can also be matched. * @param atomUsed * @return */ private boolean isExcludeGroupMatch(boolean[] atomUsed, int[] index, int excludeGroupNo) { int excludeGroupGraphBase = mExcludeGroupGraphIndex[excludeGroupNo]; int excludeGroupGraphMax = excludeGroupGraphBase + 1; while (excludeGroupGraphMax < mFragmentGraphSizeWithExcludeGroups && mExcludeGroupNo[mFragmentGraphAtom[excludeGroupGraphMax]] == excludeGroupNo) excludeGroupGraphMax++; for (int i=excludeGroupGraphBase; i= mMolecule.getAtoms()) { index[current]++; continue; } int candidate = mMolecule.getConnAtom(mMatchTable[mFragmentGraphParentAtom[current]], index[current]); if (!mFragmentGraphIsRingClosure[current]) { // current graph position is not an anchor if (!atomUsed[candidate]) { if (areAtomsSimilar(candidate, mFragmentGraphAtom[current]) && areBondsSimilar(mMolecule.getConnBond(mMatchTable[mFragmentGraphParentAtom[current]], index[current]), mFragmentGraphParentBond[current])) { atomUsed[candidate] = true; mMatchTable[mFragmentGraphAtom[current]] = candidate; current++; } } } else { // current graph position is ringClosure if (candidate == 
mMatchTable[mFragmentGraphAtom[current]] && areBondsSimilar(mMolecule.getConnBond(mMatchTable[mFragmentGraphParentAtom[current]], index[current]), mFragmentGraphParentBond[current])) { current++; } } } if (current == excludeGroupGraphMax) { if (doTHParitiesMatch(excludeGroupNo) && doEZParitiesMatch(excludeGroupNo) && doBridgeBondsMatch(atomUsed, excludeGroupNo)) { // remove match table entries for exclude atoms for (int i=excludeGroupGraphBase; i * - Bridge bonds in the molecule are not matched to any fragment bond
* - Bridge bonds in the fragment are not considered in the graph-matching and
* checked after an otherwise successful match, whether the shortest path of
* unmatched atoms satisfies the min- and max-atom criteria.
* For fragment and(!) molecule containing bridge bonds we would need a more complex * handling: - for every fragment bridge check all unmatched molecule paths and count * for every path min- and max-lengths (considering all bridge bonds within path). * Consider a match, if min- and max-atoms range fits into fragments bridge bond range. * If we have multiple bridge bonds in fragment and partially overlapping bridge matches * in the molecule, it would get very nasty... * @param moleculeAtomUsed * @param excludeGroupNo * @return */ private boolean doBridgeBondsMatch(boolean[] moleculeAtomUsed, int excludeGroupNo) { if (mBridgeBondList != null) { for (BridgeBond bb:mBridgeBondList) { if (mExcludeGroupNo == null || (excludeGroupNo == -1 && mExcludeGroupNo[bb.atom1] == -1 && mExcludeGroupNo[bb.atom2] == -1) || (excludeGroupNo != -1 && (mExcludeGroupNo[bb.atom1] == excludeGroupNo || mExcludeGroupNo[bb.atom2] == excludeGroupNo))) { // if ((mIsExcludeAtom[bb.atom1] || mIsExcludeAtom[bb.atom2]) == isExcludeFragment) { int bridgeSize = mMolecule.getPathLength(mMatchTable[bb.atom1], mMatchTable[bb.atom2], bb.maxBridgeSize+1, moleculeAtomUsed) - 1; if (bridgeSize < bb.minBridgeSize || bridgeSize > bb.maxBridgeSize) return false; } } } return true; } /** * @param moleculeBond flag list of fragment bond features (features present) * @param fragmentBond flag list of molecule bond features (features allowed) * @return true if all molecule bond features are present in fragment bond */ public boolean areBondsSimilar(int moleculeBond, int fragmentBond) { if ((mMoleculeBondFeatures[moleculeBond] & ~mFragmentBondFeatures[fragmentBond]) != 0) return false; int ringSize = (mFragment.getBondQueryFeatures(fragmentBond) & Molecule.cBondQFRingSize) >> Molecule.cBondQFRingSizeShift; if (ringSize != 0) { if (mMolecule.isFragment() && ringSize == (mMolecule.getBondQueryFeatures(fragmentBond) & Molecule.cBondQFRingSize) >> Molecule.cBondQFRingSizeShift) return true; boolean found = false; 
RingCollection ringSet = mMolecule.getRingSet(); for (int i=0; i atomicNo1) return false; } return true; } private boolean listsOverlap(int[] list1, int[] list2) { // returns true if both lists share at least one common member int i1 = 0; int i2 = 0; while (i1 0) queryDefaults |= (Molecule.cAtomQFNotCharge0 | Molecule.cAtomQFNotChargeNeg); int hydrogens = mol.getAllHydrogens(atom); switch (hydrogens) { case 0: queryDefaults |= (Molecule.cAtomQFHydrogen & ~Molecule.cAtomQFNot0Hydrogen); break; case 1: queryDefaults |= (Molecule.cAtomQFHydrogen & ~Molecule.cAtomQFNot1Hydrogen); break; case 2: queryDefaults |= (Molecule.cAtomQFHydrogen & ~Molecule.cAtomQFNot2Hydrogen); break; default: queryDefaults |= (Molecule.cAtomQFHydrogen & ~Molecule.cAtomQFNot3Hydrogen); break; } int neighbours = mol.getConnAtoms(atom); switch (neighbours) { case 0: queryDefaults |= (Molecule.cAtomQFNeighbours & ~Molecule.cAtomQFNot0Neighbours); break; case 1: queryDefaults |= (Molecule.cAtomQFNeighbours & ~Molecule.cAtomQFNot1Neighbour); break; case 2: queryDefaults |= (Molecule.cAtomQFNeighbours & ~Molecule.cAtomQFNot2Neighbours); break; case 3: queryDefaults |= (Molecule.cAtomQFNeighbours & ~Molecule.cAtomQFNot3Neighbours); break; default: queryDefaults |= (Molecule.cAtomQFNeighbours & ~Molecule.cAtomQFNot4Neighbours); break; } int piElectrons = mol.getAtomPi(atom); switch (piElectrons) { case 0: queryDefaults |= (Molecule.cAtomQFNot1PiElectron | Molecule.cAtomQFNot2PiElectrons); break; case 1: queryDefaults |= (Molecule.cAtomQFNot0PiElectrons | Molecule.cAtomQFNot2PiElectrons); break; default: queryDefaults |= (Molecule.cAtomQFNot0PiElectrons | Molecule.cAtomQFNot1PiElectron); break; } } else { // The fragments implicit features are not really necessary, // but may speed up the graph matching. 
if (mol.isAromaticAtom(atom)) queryDefaults |= Molecule.cAtomQFAromatic; int ringBonds = mol.getAtomRingBondCount(atom); if (ringBonds != 0) { queryDefaults |= Molecule.cAtomQFNotChain; if (ringBonds > 2) queryDefaults |= Molecule.cAtomQFNot2RingBonds; if (ringBonds > 3) queryDefaults |= Molecule.cAtomQFNot3RingBonds; } int charge = mol.getAtomCharge(atom); if (charge < 0) queryDefaults |= (Molecule.cAtomQFNotCharge0 | Molecule.cAtomQFNotChargePos); else if (charge > 0) queryDefaults |= (Molecule.cAtomQFNotCharge0 | Molecule.cAtomQFNotChargeNeg); // fragment atoms with n neighbours must have // at least n neighbours in a matching molecule int neighbours = mol.getConnAtoms(atom); switch (neighbours) { case 0: break; case 1: queryDefaults |= (Molecule.cAtomQFNot0Neighbours); break; case 2: queryDefaults |= (Molecule.cAtomQFNot0Neighbours | Molecule.cAtomQFNot1Neighbour); break; case 3: queryDefaults |= (Molecule.cAtomQFNot0Neighbours | Molecule.cAtomQFNot1Neighbour | Molecule.cAtomQFNot2Neighbours); break; default: queryDefaults |= (Molecule.cAtomQFNeighbours & ~Molecule.cAtomQFNot4Neighbours); break; } } int piElectrons = mol.getAtomPi(atom); if (piElectrons > 0) queryDefaults |= Molecule.cAtomQFNot0PiElectrons; if (piElectrons > 1) queryDefaults |= Molecule.cAtomQFNot1PiElectron; return queryDefaults; } /** * Generates inherent feature flags of a given bond. 
* @param mol molecule or fragment of the SSS * @param bond the bond of which to generate feature flags * @return bond features independent of query features */ private int getBondQueryDefaults(StereoMolecule mol, int bond) { int queryDefaults = 0; if (mol.isDelocalizedBond(bond) || mol.getBondType(bond) == Molecule.cBondTypeDelocalized) queryDefaults |= Molecule.cBondQFDelocalized; else switch (mol.getBondOrder(bond)) { case 0: queryDefaults |= Molecule.cBondTypeMetalLigand; break; case 1: queryDefaults |= Molecule.cBondQFSingle; break; case 2: queryDefaults |= Molecule.cBondQFDouble; break; case 3: queryDefaults |= Molecule.cBondQFTriple; break; } if (mol.isRingBond(bond)) queryDefaults |= Molecule.cBondQFRing; else if (!mol.isFragment()) queryDefaults |= Molecule.cBondQFNotRing; if (mol.isAromaticBond(bond)) queryDefaults |= Molecule.cBondQFAromatic; else if (!mol.isFragment()) queryDefaults |= Molecule.cBondQFNotAromatic; return queryDefaults; } private void buildBridgeBondList() { mBridgeBondList = null; for (int bond=0; bond(); BridgeBond bridgeBond = new BridgeBond(); bridgeBond.atom1 = mFragment.getBondAtom(0, bond); bridgeBond.atom2 = mFragment.getBondAtom(1, bond); bridgeBond.minBridgeSize = mFragment.getBondBridgeMinSize(bond); bridgeBond.maxBridgeSize = mFragment.getBondBridgeMaxSize(bond); mBridgeBondList.add(bridgeBond); } } } private class BridgeBond { int atom1,atom2,minBridgeSize,maxBridgeSize; } private static int[] copyOf(int[] original, int newLength) { int[] copy = new int[newLength]; System.arraycopy(original, 0, copy, 0, Math.min(original.length, newLength)); return copy; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy