All Downloads are FREE. Search and download functionalities are using the official Maven repository.

gov.nih.ncats.molwitch.cdk.CdkAtom Maven / Gradle / Ivy

Go to download

MolWitch implementation that uses CDK as the underlying cheminformatics framework.

There is a newer version: 1.0.21
Show newest version
/*
 * NCATS-MOLWITCH-CDK
 *
 * Copyright (c) 2023.
 *
 * This work is free software; you can redistribute it and/or modify it under the terms of the
 * GNU Lesser General Public License as published by the Free Software Foundation;
 * either version 2.1 of the License, or (at your option) any later version.
 *
 * This work is distributed in the hope that it will be useful, but without any warranty;
 * without even the implied warranty of merchantability or fitness for a particular purpose.
 * See the GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public License along with this library;
 *  if not, write to:
 *
 *  the Free Software Foundation, Inc.
 *  59 Temple Place, Suite 330
 *  Boston, MA 02111-1307 USA
 */

package gov.nih.ncats.molwitch.cdk;

import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
import java.util.Objects;
import java.util.Optional;
import java.util.OptionalInt;
import java.util.function.BiConsumer;
import java.util.function.Function;
import java.util.function.Supplier;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import javax.vecmath.Point2d;
import javax.vecmath.Point3d;

import org.openscience.cdk.AtomRef;
import org.openscience.cdk.CDKConstants;
import org.openscience.cdk.SingleElectron;
import org.openscience.cdk.config.IsotopeFactory;
import org.openscience.cdk.config.Isotopes;
import org.openscience.cdk.graph.Cycles;
import org.openscience.cdk.interfaces.*;
import org.openscience.cdk.isomorphism.matchers.IQueryAtom;
import org.openscience.cdk.isomorphism.matchers.RGroupQuery;
import org.openscience.cdk.tools.manipulator.AtomContainerManipulator;

import gov.nih.ncats.molwitch.Atom;
import gov.nih.ncats.molwitch.AtomCoordinates;
import gov.nih.ncats.molwitch.Bond;
import gov.nih.ncats.molwitch.Bond.BondType;
import gov.nih.ncats.molwitch.Bond.Stereo;
import gov.nih.ncats.molwitch.Chirality;
import uk.ac.ebi.beam.Element;

public class CdkAtom implements Atom{
	
	private static final Pattern validLabelPattern = Pattern.compile("^R\\d+$");
	 

	private static IsotopeFactory isotopeFactory;
	
	static {
		try {
		isotopeFactory = Isotopes.getInstance();
		}catch(IOException e) {
			throw new IllegalStateException("error loading isotope data", e);
		}
	}
	
	private IAtom atom;
	private CdkChemicalImpl parent;
	
	public static IAtom getIAtomFor(Atom a){
		return ((CdkAtom)a).atom;
	}
	
	public CdkAtom(IAtom atom, CdkChemicalImpl parent) {
		Objects.requireNonNull(atom);
		
		this.parent = parent;
		this.atom = atom;
		
	}
	
	

	@Override
	public boolean isValidAtomicSymbol() {
		return Element.ofSymbol(getSymbol()) !=null;
	}

	@Override
	public int getSmallestRingSize() {
		//this should set the ISINRING flags
		parent.ringsSearcherSupplier.get();
		if( !atom.isInRing()) {
			return 0;
		};
	
		
		IRingSet ringSet = Cycles.sssr(((IAtomContainer) parent.getWrappedObject())).toRingSet();
		if(!ringSet.contains(atom)) {
			return 0;
		}
		int min = Integer.MAX_VALUE;
		for(IAtomContainer r : ringSet.atomContainers()) {
			if(r.contains(atom)) {
				int len = r.getAtomCount();
				if(len < min) {
					min = len;
				}
			}
		}
		
		return min;
	}



	@Override
	public boolean isQueryAtom() {
		return AtomRef.deref(atom) instanceof IQueryAtom;
	}



	@Override
	public OptionalInt getAtomToAtomMap() {
		Object atomAtomMapping = atom.getProperty(CDKConstants.ATOM_ATOM_MAPPING);
		if(atomAtomMapping ==null) {
			return OptionalInt.empty();
		}
		int value=0;
		if (atomAtomMapping instanceof String) {
            	//this will throw a IllegalArgumentException (runtime)
            value = Integer.parseInt((String) atomAtomMapping);
		}else if(atomAtomMapping instanceof Integer) {
			value = (Integer) atomAtomMapping;
		}
		if(value ==0) {
			return OptionalInt.empty();
		}
		return OptionalInt.of(value);
	}

	@Override
	public void setAtomToAtomMap(int value) {
		if(value ==0) {
			atom.removeProperty(CDKConstants.ATOM_ATOM_MAPPING);
		}else {
			atom.setProperty(CDKConstants.ATOM_ATOM_MAPPING, value);
		}
		
	}

	@Override
	public boolean isInRing() {
		//this should set the ISINRING flags
		parent.ringsSearcherSupplier.get();
		return atom.isInRing();
	}

	@Override
	public String getSymbol() {
		return atom.getSymbol();
	}
	
	

	@Override
	public boolean isIsotope() {
		Integer mass = atom.getMassNumber();
		if(mass ==null) {
			return false;
		}

		double majorMass = isotopeFactory.getMajorIsotopeMass(atom.getAtomicNumber());
		if(majorMass == 2D* getAtomicNumber()){
			//no major mass
			return true;
		}
		return !(Double.valueOf(mass).equals(majorMass));
	}

	@Override
	public List getBonds() {
		return parent.getBondsFor(atom);
	}

	IAtom getAtom() {
		return atom;
	}

	@Override
	public int getAtomicNumber() {
		return atom.getAtomicNumber();
	}

	@Override
	public void setAtomicNumber(int atomicNumber) {
		atom.setAtomicNumber(atomicNumber);
	}

	@Override
	public boolean hasAromaticBond() {
		return atom.isAromatic();
	}

	@Override
	public int hashCode() {
		final int prime = 31;
		int result = 1;
		result = prime * result + atom.hashCode();
		return result;
	}

	@Override
	public boolean equals(Object obj) {
		if (this == obj)
			return true;
		if (obj == null)
			return false;
		if (getClass() != obj.getClass())
			return false;
		CdkAtom other = (CdkAtom) obj;
		if (!atom.equals(other.atom))
			return false;
		return true;
	}

	@Override
	public int getCharge() {
		Integer charge = atom.getFormalCharge();
		//assume unset = 0 ?
		if(charge ==null || CDKConstants.UNSET == charge){
			return 0;
		}
		return charge.intValue();
	}

	@Override
	public int getRadical() {
		List list = parent.getContainer().getConnectedSingleElectronsList(atom);
		if(list.isEmpty()) {
			return 0;
		}
		return list.stream().map(ise -> ise.getElectronCount()).filter(Objects::nonNull).mapToInt(Integer::intValue).sum();
	}

	@Override
	public void setRadical(int radical) {

		//check old radical value don't do anything if match
		int oldValue = getRadical();
		if(oldValue == radical){
			return;
		}
		ISingleElectron ise = new SingleElectron(atom);
		ise.setElectronCount(radical);

		IAtomContainer container = parent.getContainer();
		container.getConnectedSingleElectronsList(atom)
								.forEach(container::removeSingleElectron);

		container.addSingleElectron(ise);

	}


	@Override
	public AtomCoordinates getAtomCoordinates() {
		Point3d points = atom.getPoint3d();
		if(points !=null) {
			return AtomCoordinates.valueOf(points.x, points.y, points.z);
		}
		Point2d otherPoints = atom.getPoint2d();
		if(otherPoints !=null) {
			return AtomCoordinates.valueOf(otherPoints.x, otherPoints.y);
		}
		return null;
	}

	@Override
	public void setAtomCoordinates(AtomCoordinates atomCoordinates) {
		if(atomCoordinates ==null) {
			atom.setPoint2d(null);
			atom.setPoint3d(null);
		}else if(atomCoordinates.is3D()) {
			atom.setPoint2d(null);
			atom.setPoint3d(new Point3d(atomCoordinates.getX(), atomCoordinates.getY(), atomCoordinates.getZ().getAsDouble()));
		}else {
			atom.setPoint3d(null);
			atom.setPoint2d(new Point2d(atomCoordinates.getX(), atomCoordinates.getY()));
		
		}
		
	}

	
	

	@Override
	public Chirality getChirality() {
		if(!parent.cahnIngoldPrelogSupplier.hasRun()) {
			//forces running CIP rules
		
			parent.getTetrahedrals();
		}
		String value= Optional.ofNullable(atom.getProperty(CDKConstants.CIP_DESCRIPTOR))
				.map(t->t.toString())
				.orElse(null);
		
//		if(dd!=nu)
//		String value = atom.getProperty(CDKConstants.CIP_DESCRIPTOR);
//		
		if("R".equals(value) || "M".equals(value)) {
			return Chirality.R;
		}
		if("r".equals(value)) {
			return Chirality.r;
		}
		
		if("S".equals(value) || "P".equals(value)) {
			return Chirality.S;
		}
		
		if("s".equals(value)) {
			return Chirality.s;
		}
		
		if("EITHER".equals(value)) {
			return Chirality.Parity_Either;
		}
		
		return Chirality.Non_Chiral;
	}

	@Override
	public void setChirality(Chirality chirality) {
	    Chirality chir=getChirality();
	    if(chir==chirality)return;
	    
	    //simple inversion
	    if(((chirality==Chirality.R || chirality==Chirality.r)  && (chir==Chirality.S||chir==Chirality.s)) ||
	       ((chirality==Chirality.S || chirality==Chirality.s)  && (chir==Chirality.R||chir==Chirality.r)) 
	            ) {
	        this.getBonds().stream()
	        .filter(b->b.getBondType().equals(BondType.SINGLE))
	        .filter(b->!b.getStereo().equals(Stereo.NONE))
	        .forEach(bb->{
	            Stereo bbs=bb.getStereo();
	            if((bb.getAtom1().equals(this) && (bbs.equals(Stereo.UP) || bbs.equals(Stereo.DOWN))) ||
	                    (bb.getAtom2().equals(this) && (bbs.equals(Stereo.UP_INVERTED) || bbs.equals(Stereo.DOWN_INVERTED)))
	                    ) {
	                bb.setStereo(bbs.flip());
	            }
	        });

	        atom.setProperty(CDKConstants.CIP_DESCRIPTOR,chirality.toString());
//	        atom.setStereoParity((atom.getStereoParity()+1)%2);
//	        parent.getContainer().setStereoElements(new ArrayList<>());
	        
	    //simple removal
	    }else if(chirality.equals(Chirality.Parity_Either)) {
	        this.getBonds().stream()
            .filter(b->b.getBondType().equals(BondType.SINGLE))
            .filter(b->!b.getStereo().equals(Stereo.NONE))
            .forEach(bb->{
                Stereo bbs=bb.getStereo();
                if((bb.getAtom1().equals(this) && (bbs.equals(Stereo.UP) || bbs.equals(Stereo.DOWN))) ||
                        (bb.getAtom2().equals(this) && (bbs.equals(Stereo.UP_INVERTED) || bbs.equals(Stereo.DOWN_INVERTED)))
                        ) {
                    bb.setStereo(Stereo.NONE);
                }
            });

	        atom.setProperty(CDKConstants.CIP_DESCRIPTOR,"EITHER");
	    }else if(chirality.isDefined() && (chir.isEither() || chir == Chirality.Non_Chiral)) {
	    
	    	Optional sBond = this.getBonds().stream()
            .filter(b->b.getBondType().equals(BondType.SINGLE))
            .filter(b->b.getStereo().equals(Stereo.NONE))
            .findFirst();
	    	
	    	
            sBond.ifPresent(b->{
            	if(b.getAtom1().getAtomIndexInParent()==this.getAtomIndexInParent()){
            		b.setStereo(Stereo.UP);
            	}else {
            		b.setStereo(Stereo.UP_INVERTED);
            	}
            });
            
            
	    	parent.cahnIngoldPrelogSupplier.resetCache();
	    	Chirality co=this.getChirality();
	    	if((co.isRForm() && chirality.isRForm()) || 
	    			(co.isSForm() && chirality.isSForm())
	    			) {
	    		//do nothing	
	    	}else if((co.isSForm() && chirality.isRForm()) || 
	    			(co.isRForm() && chirality.isSForm())
	    			) {
	    		setChirality(chirality);
	    	}else {
	    		//could not set
	    	}
	        
	    }
	    
//	    parent.cahnIngoldPrelogSupplier.resetCache();
	}

	@Override
	public int getMassNumber() {
		Integer num= atom.getMassNumber();
		if(num==null){
			return 0;
		}
		return num.intValue();
	}
	

	@Override
	public double getExactMass() {
		// TODO Auto-generated method stub
		Double d= atom.getExactMass();
		if(d ==null) {
			return 0;
		}
		return d.doubleValue();
	}

	@Override
	public void setCharge(int charge) {
		atom.setFormalCharge(charge);

//		recomputeImplicitHydrogens();
	}

	private void recomputeImplicitHydrogens() {
		atom.setImplicitHydrogenCount(null);
		parent.setImplicitHydrogens(atom);
	}

	@Override
	public void setMassNumber(int mass) {
		if(mass <0){
			throw new IllegalArgumentException("mass can not be negative");
		}
		if(mass ==0){
			atom.setMassNumber(null);
		}else{
			atom.setMassNumber(mass);
		}
//		recomputeImplicitHydrogens();
	}

	@Override
	public int getImplicitHCount() {
		Integer ret = atom.getImplicitHydrogenCount();
		if(ret ==null){
			//bug in hydrogen count
			if(isQueryAtom()){
				return 0;
			}
			for(Bond b : getBonds()){
				if(b.isQueryBond()){
					return 0;
				}
			}
			//compute it
			return parent.setImplicitHydrogens(atom);
			
		}
		return ret;
	}
	

	@Override
	public void setImplicitHCount(Integer implicitH) {
		atom.setImplicitHydrogenCount(implicitH);
	}



	@Override
	public OptionalInt getValence() {
		parent.perceiveAtomTypesOfNonQueryAtoms.get();
		
		Integer valence= atom.getValency();
		if(valence ==null) {
			return OptionalInt.empty();
		}
		return OptionalInt.of(valence);
	}
	

	@Override
	public boolean hasValenceError() {
		//after perceiving atom types valence should not be null unless there's an error?
		//TODO maybe not set on query atoms?
		OptionalInt opin=getValence();
		if(!opin.isPresent())return true;
		
		int v = opin.getAsInt();
		
		// TODO: Need a real valence model check here ...
		// CDK probably has one. Generally specific elements
		// are only allowed to have certain valences. That is,
		// there are only certain bond count/charge/radical
		// configurations that are allowed. The most common
		// case we're worried about though is pentavalent
		// carbon. So we'll currently just throw an error
		// on that one case.
		
		if("C".equals(this.getSymbol()) && v>4){
			return true;
		}
		if("N".equals(this.getSymbol())){
			if(v==5){
				if(this.getCharge()==1){
					return false;
				}else{
					return true;
				}
			}
		}
		
		return false;
	}

	@Override
	public boolean isRGroupAtom() {
		return getRGroupIndex().isPresent();
	}

	@Override
	public boolean isPseudoAtom() {
		return CdkUtil.isPseudoAtom(atom);
	}

	@Override
	public OptionalInt getRGroupIndex() {
		
		return getPseudoAtomField(iPseudoAtom -> {
			String label = iPseudoAtom.getLabel();
			 if(label !=null && isValidRgroupQueryLabel(label)) {
				 return OptionalInt.of(Integer.parseInt(label.substring(1)));
			 }
			 return OptionalInt.empty();
		},
				OptionalInt::empty);

	}


	@Override
	public void setRGroup(Integer rGroup) {
		if(rGroup ==null || rGroup < 1) {
			if(isRGroupAtom()) {
				setAlias(null);
			}
		}else {
			setAlias("R"+rGroup);
		}
	}

	private  T getPseudoAtomField(Function function, Supplier emptySupplier) {
		IAtom deref = AtomRef.deref(atom);
		if(deref instanceof IPseudoAtom) {
			IPseudoAtom iPseudoAtom = (IPseudoAtom)deref;
			return function.apply(iPseudoAtom);
		}
		return emptySupplier.get();
	}

	@Override
	public Optional getAlias() {
		return getPseudoAtomField( a-> Optional.ofNullable(a.getLabel()), Optional::empty);
	}

	@Override
	public void setAlias(String alias) {
		changeToPseudoAtomIfNeeded((pseudoAtom, newObj) -> {
			pseudoAtom.setLabel(alias);
			if(newObj) {
				pseudoAtom.setSymbol(alias);
			}
			
		});
		
	}
	
	

	//borrowed from CDK MDLV20000Reader with minor adjustments
	//to make it take consumers for various operations
	
	private void changeToPseudoAtomIfNeeded(BiConsumer consumer) {
		IAtomContainer container = parent.getContainer();
	 final IPseudoAtom pseudoAtom = atom instanceof IPseudoAtom ? (IPseudoAtom) atom : container.getBuilder()
             .newInstance(IPseudoAtom.class);
     if (atom.equals(pseudoAtom)) {
    	 consumer.accept(pseudoAtom, false);
     } else {
    	 //some consumers might change the symbol but by default reuse atom symbol
         pseudoAtom.setSymbol(atom.getSymbol());
         pseudoAtom.setAtomicNumber(0);
         pseudoAtom.setPoint2d(atom.getPoint2d());
         pseudoAtom.setPoint3d(atom.getPoint3d());
         pseudoAtom.setMassNumber(atom.getMassNumber());
         pseudoAtom.setFormalCharge(atom.getFormalCharge());
         pseudoAtom.setValency(atom.getValency());
         
         consumer.accept(pseudoAtom, true);
         //katzelda -chemkit note : need to update atom and bond caches
 		//Looking into the source code for this method
         //it doesn't make  new IBond objects just
         //updates the fields for  IBond objects
         //so we should  be OK and don't have to update our caches...
         
 		 // XXX: would be faster to track all replacements and do it all in one
         AtomContainerManipulator.replaceAtomByAtom(container, atom, pseudoAtom);
        
         this.atom = pseudoAtom;
     }
	}

	@Override
	public String toString() {
		return "CdkAtom [atom=" + atom + "]";
	}



	@Override
	public int getAtomIndexInParent() {
		return parent.getContainer().indexOf(atom);
	}

    /**
     * Validates a Pseudo atom's label to be valid RGroup query label (R1..R32).
     * @param Rxx R-group label like R1 or R10
     * @return true if R1..R32+, otherwise false
     */
    public static boolean isValidRgroupQueryLabel(String Rxx) {
        Matcher matcher = validLabelPattern.matcher(Rxx);
        if (matcher.find()) {
            int groupNumber = Integer.parseInt(Rxx.substring(1));
            //Note that CDK restricts to only R32 and below, but we are allowing larger here
            
            if (groupNumber >= 1) {
                return true;
            }
        }
        return false;
    }

	

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy