All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.openscience.cdk.hash.MinimumEquivalentCyclicSetUnion Maven / Gradle / Ivy

/*
 * Copyright (c) 2013 John May 
 *
 * Contact: [email protected]
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public License
 * as published by the Free Software Foundation; either version 2.1
 * of the License, or (at your option) any later version.
 * All we ask is that proper credit is given for our work, which includes
 * - but is not limited to - adding the above copyright notice to the beginning
 * of your source code files, and to any copyright notice that you may distribute
 * with programs based on this work.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 U
 */

package org.openscience.cdk.hash;

import org.openscience.cdk.interfaces.IAtomContainer;
import org.openscience.cdk.ringsearch.RingSearch;

import java.util.Collections;
import java.util.HashSet;
import java.util.Map;
import java.util.Set;
import java.util.TreeMap;

/**
 * The union of all the smallest set of equivalent values are members of a ring.
 * This class is intended to drive the systematic perturbation of the {@link
 * org.openscience.cdk.hash.PerturbedAtomHashGenerator}. The method is more
 * comprehensive then a single {@link MinimumEquivalentCyclicSet} and not as
 * computationally demanding as {@link AllEquivalentCyclicSet}. In reality one
 * should choose either use the fast (but good) heuristic {@link
 * MinimumEquivalentCyclicSet} or the exact {@link AllEquivalentCyclicSet}. This
 * method is provided for demonstration only.
 *
 * As with the {@link MinimumEquivalentCyclicSet} perturbation, this method does
 * not guarantee that all molecules will be distinguished. At the time of
 * writing (Feb 2013) there are only 8 structure in PubChem-Compound which need
 * the more comprehensive perturbation method ({@link AllEquivalentCyclicSet}),
 * these are listed below.
 *
 * 
 * 
 * 
 * 
 * 
CID 144432 * and CID 15584856
CID 138898 * and CID 241107
CID 9990759 * and CID 10899923
CID 5460768 * and CID 20673269
* *
The easiest way to use this class is with the {@link * org.openscience.cdk.hash.HashGeneratorMaker}. *
 * MoleculeHashGenerator generator =
 *   new HashGeneratorMaker().depth(6)
 *                           .elemental()
 *                           .perturbWith(new MinimumEquivalentCyclicSetUnion())
 *                           .molecular();
 * 
* * @author John May * @cdk.module hash * @see org.openscience.cdk.hash.PerturbedAtomHashGenerator * @see MinimumEquivalentCyclicSet * @see AllEquivalentCyclicSet * @deprecated provided for to demonstrate a relatively robust but ultimately * incomplete approach * @cdk.githash */ @Deprecated final class MinimumEquivalentCyclicSetUnion extends EquivalentSetFinder { /** *{@inheritDoc} */ @Override public Set find(long[] invariants, IAtomContainer container, int[][] graph) { int n = invariants.length; // find cyclic vertices using DFS RingSearch ringSearch = new RingSearch(container, graph); // ordered map of the set of vertices for each value Map> equivalent = new TreeMap>(); // divide the invariants into equivalent indexed and ordered sets for (int i = 0; i < invariants.length; i++) { Long invariant = invariants[i]; Set set = equivalent.get(invariant); if (set == null) { if (ringSearch.cyclic(i)) { set = new HashSet(n / 2); set.add(i); equivalent.put(invariant, set); } } else { set.add(i); } } // find the smallest set of equivalent cyclic vertices int minSize = Integer.MAX_VALUE; Set min = Collections.emptySet(); for (Map.Entry> e : equivalent.entrySet()) { Set vertices = e.getValue(); if (vertices.size() < minSize && vertices.size() > 1) { min = vertices; minSize = vertices.size(); } else if (vertices.size() == minSize) { min.addAll(vertices); } } return min; } }




© 2015 - 2024 Weber Informatics LLC | Privacy Policy