org.coode.owlapi.obo.parser.OBOConsumer Maven / Gradle / Ivy
/*
* This file is part of the OWL API.
*
* The contents of this file are subject to the LGPL License, Version 3.0.
*
* Copyright (C) 2011, The University of Manchester
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see http://www.gnu.org/licenses/.
*
*
* Alternatively, the contents of this file may be used under the terms of the Apache License, Version 2.0
* in which case, the provisions of the Apache License Version 2.0 are applicable instead of those above.
*
* Copyright 2011, University of Manchester
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.coode.owlapi.obo.parser;
import java.net.URI;
import java.util.Collections;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Map;
import java.util.Set;
import java.util.logging.Logger;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import org.semanticweb.owlapi.model.AddAxiom;
import org.semanticweb.owlapi.model.AddImport;
import org.semanticweb.owlapi.model.AddOntologyAnnotation;
import org.semanticweb.owlapi.model.IRI;
import org.semanticweb.owlapi.model.OWLAnnotation;
import org.semanticweb.owlapi.model.OWLAnnotationAssertionAxiom;
import org.semanticweb.owlapi.model.OWLAnnotationProperty;
import org.semanticweb.owlapi.model.OWLAnnotationValue;
import org.semanticweb.owlapi.model.OWLAxiom;
import org.semanticweb.owlapi.model.OWLClass;
import org.semanticweb.owlapi.model.OWLClassExpression;
import org.semanticweb.owlapi.model.OWLDataFactory;
import org.semanticweb.owlapi.model.OWLDeclarationAxiom;
import org.semanticweb.owlapi.model.OWLEntity;
import org.semanticweb.owlapi.model.OWLImportsDeclaration;
import org.semanticweb.owlapi.model.OWLLiteral;
import org.semanticweb.owlapi.model.OWLOntology;
import org.semanticweb.owlapi.model.OWLOntologyID;
import org.semanticweb.owlapi.model.OWLOntologyLoaderConfiguration;
import org.semanticweb.owlapi.model.OWLOntologyManager;
import org.semanticweb.owlapi.model.OWLRuntimeException;
import org.semanticweb.owlapi.model.SetOntologyID;
import org.semanticweb.owlapi.model.UnloadableImportException;
import org.semanticweb.owlapi.util.CollectionFactory;
/**
* Author: Matthew Horridge
* The University Of Manchester
* Bio-Health Informatics Group
* Date: 10-Jan-2007
*/
@SuppressWarnings("javadoc")
public class OBOConsumer implements OBOParserHandler {
private static final Logger logger = Logger.getLogger(OBOConsumer.class.getName());
private static final String IMPORT_TAG_NAME = "import";
private OWLOntologyLoaderConfiguration configuration;
private OWLOntologyManager owlOntologyManager;
private OWLOntology ontology;
private boolean inHeader;
private String currentId;
private Map handlerMap;
// private String defaultNamespace;
private String defaultNamespaceTagValue = OBOVocabulary.OBO_IRI_BASE;
private String stanzaType;
private boolean termType;
private boolean typedefType;
private boolean instanceType;
private Set intersectionOfOperands;
private Set unionOfOperands;
private Map uriCache = new HashMap();
private Map symbolicIdCache = new HashMap();
private Map tagIRICache = new HashMap();
private IDSpaceManager idSpaceManager = new IDSpaceManager();
private String ontologyTagValue = "";
private String dataVersionTagValue = "";
public OBOConsumer(OWLOntology ontology, OWLOntologyLoaderConfiguration configuration, IRI baseIRI) {
this.configuration = configuration;
owlOntologyManager = ontology.getOWLOntologyManager();
this.ontology = ontology;
intersectionOfOperands = new HashSet();
unionOfOperands = new HashSet();
uriCache = new HashMap();
for (OBOVocabulary v : OBOVocabulary.values()) {
tagIRICache.put(v.getName(), v.getIRI());
}
ontologyTagValue = getDefaultOntologyTagValue(baseIRI);
loadBuiltinURIs();
setupTagHandlers();
}
private String getDefaultOntologyTagValue(IRI baseIRI) {
URI baseURI = baseIRI.toURI();
String baseURIPath = baseURI.getPath();
if(baseURIPath == null) {
return baseIRI.toString();
}
int lastSlashIndex = baseURIPath.lastIndexOf("/");
if(lastSlashIndex == -1 || lastSlashIndex + 1 == baseURIPath.length()) {
return baseURIPath;
}
return baseURIPath.substring(lastSlashIndex + 1);
}
@Deprecated
@SuppressWarnings("unused")
public OBOConsumer(OWLOntologyManager owlOntologyManager, OWLOntology ontology, OWLOntologyLoaderConfiguration configuration, IRI baseIRI) {
this(ontology, configuration, baseIRI);
}
public OWLOntologyManager getOWLOntologyManager() {
return owlOntologyManager;
}
public OWLOntology getOntology() {
return ontology;
}
public String getCurrentId() {
return currentId;
}
public void addSymbolicIdMapping(String symbolicName, IRI fullIRI) {
symbolicIdCache.put(symbolicName, fullIRI);
}
/**
* Sets the value of the default-namespace tag for the current ontology being parsed.
* @param defaultNamespaceTagValue The value of the default-namespace tag.
*/
public void setDefaultNamespaceTagValue(String defaultNamespaceTagValue) {
this.defaultNamespaceTagValue = defaultNamespaceTagValue;
}
/**
* Gets the default-namespace tag value for the current ontology. If not default-namespace tag value has been set
* explicitly then this method returns the default value which is equal to {@link OBOVocabulary#OBO_IRI_BASE}.
* @return The default-namespace tag value. Not null
.
*/
public String getDefaultNamespaceTagValue() {
return defaultNamespaceTagValue;
}
/**
* Sets the value of the ontology tag for the current ontology that is being parsed. This is used to construct
* an {@link org.semanticweb.owlapi.model.OWLOntologyID} for the current ontology once the ontology header has
* been parsed in its entirety.
* @param ontologyTagValue The ontology tag value. Ultimately, this will be translated to an IRI.
*/
public void setOntologyTagValue(String ontologyTagValue) {
this.ontologyTagValue = ontologyTagValue;
}
/**
* Sets the value of the data-version tag for the current ontology that is being parsed. This is used to construct
* an {@link org.semanticweb.owlapi.model.OWLOntologyID} for the current ontology once the ontology header has
* been parsed in its entirety.
* @param dataVersionTagValue The data-version tag value. Ultimately, this will be translated to an IRI.
*/
public void setDataVersionTagValue(String dataVersionTagValue) {
this.dataVersionTagValue = dataVersionTagValue;
}
public void registerIdSpace(String idSpacePrefix, String iriPrefix) {
idSpaceManager.setIRIPrefix(idSpacePrefix, iriPrefix);
}
/**
* Gets a COPY of the {@link IDSpaceManager} held by this OBOConsumer.
* @return A copy of the IDSpaceManager held by this consumer.
*/
public IDSpaceManager getIdSpaceManager() {
return idSpaceManager;
}
public void setCurrentId(String currentId) {
this.currentId = currentId;
}
public void addUnionOfOperand(OWLClassExpression classExpression) {
unionOfOperands.add(classExpression);
}
public void addIntersectionOfOperand(OWLClassExpression classExpression) {
intersectionOfOperands.add(classExpression);
}
public String getStanzaType() {
return stanzaType;
}
public boolean isTerm() {
return termType;
}
public boolean isTypedef() {
return typedefType;
}
public boolean isInstanceType() {
return instanceType;
}
private void loadBuiltinURIs() {
for (OBOVocabulary v : OBOVocabulary.values()) {
uriCache.put(v.getName(), v.getIRI());
}
}
private void setupTagHandlers() {
handlerMap = new HashMap();
addTagHandler(new OntologyTagValueHandler(this));
addTagHandler(new IDTagValueHandler(this));
addTagHandler(new NameTagValueHandler(this));
addTagHandler(new IsATagValueHandler(this));
addTagHandler(new PartOfTagValueHandler(this));
addTagHandler(new TransitiveTagValueHandler(this));
addTagHandler(new SymmetricTagValueHandler(this));
addTagHandler(new RelationshipTagValueHandler(this));
addTagHandler(new UnionOfHandler(this));
addTagHandler(new IntersectionOfHandler(this));
addTagHandler(new DisjointFromHandler(this));
addTagHandler(new AsymmetricHandler(this));
addTagHandler(new InverseHandler(this));
addTagHandler(new ReflexiveHandler(this));
addTagHandler(new TransitiveOverHandler(this));
addTagHandler(new DefaultNamespaceTagValueHandler(this));
addTagHandler(new SynonymTagValueHandler(this));
addTagHandler(new XRefTagHandler(this));
addTagHandler(new DefTagValueHandler(this));
addTagHandler(new IsObsoleteTagValueHandler(this));
addTagHandler(new IDSpaceTagValueHandler(this));
addTagHandler(new DataVersionTagValueHandler(this));
addTagHandler(new SynonymTypeDefTagHandler(this));
addTagHandler(new AltIdTagValueHandler(this));
}
private void addTagHandler(TagValueHandler handler) {
handlerMap.put(handler.getTagName(), handler);
}
@Override
public void startHeader() {
inHeader = true;
}
@Override
public void endHeader() {
inHeader = false;
setOntologyId();
}
/**
* Sets the {@link org.semanticweb.owlapi.model.OWLOntologyID} of the ontology being parsed from the tag values
* held by the {@link #ontologyTagValue} and {@link #dataVersionTagValue} field. IRIs for each field are generated
* and used to construct the {@link org.semanticweb.owlapi.model.OWLOntologyID}.
*/
private void setOntologyId() {
IRI ontologyIRI = IRI.create(idSpaceManager.getIRIPrefix(ontologyTagValue) + ontologyTagValue);
IRI versionIRI = null;
if (dataVersionTagValue.length()>0) {
versionIRI = IRI.create(ontologyIRI.toString() + "/" + dataVersionTagValue);
}
OWLOntologyID ontologyID = new OWLOntologyID(ontologyIRI, versionIRI);
ontology.getOWLOntologyManager().applyChange(new SetOntologyID(ontology, ontologyID));
}
@Override
public void startFrame(String name) {
currentId = null;
defaultNamespaceTagValue = null;
stanzaType = name;
termType = stanzaType.equals(OBOVocabulary.TERM.getName());
typedefType = false;
instanceType = false;
if (!termType) {
typedefType = stanzaType.equals(OBOVocabulary.TYPEDEF.getName());
if (!typedefType) {
instanceType = stanzaType.equals(OBOVocabulary.INSTANCE.getName());
}
}
}
@Override
public void endFrame() {
if (!unionOfOperands.isEmpty()) {
createUnionEquivalentClass();
unionOfOperands.clear();
}
if (!intersectionOfOperands.isEmpty()) {
createIntersectionEquivalentClass();
intersectionOfOperands.clear();
}
}
private void createUnionEquivalentClass() {
OWLClassExpression equivalentClass;
if (unionOfOperands.size() == 1) {
equivalentClass = unionOfOperands.iterator().next();
}
else {
equivalentClass = getDataFactory().getOWLObjectUnionOf(unionOfOperands);
}
createEquivalentClass(equivalentClass);
}
private void createIntersectionEquivalentClass() {
OWLClassExpression equivalentClass;
if (intersectionOfOperands.size() == 1) {
equivalentClass = intersectionOfOperands.iterator().next();
}
else {
equivalentClass = getDataFactory().getOWLObjectIntersectionOf(intersectionOfOperands);
}
createEquivalentClass(equivalentClass);
}
private void createEquivalentClass(OWLClassExpression classExpression) {
OWLAxiom ax = getDataFactory().getOWLEquivalentClassesAxiom(CollectionFactory.createSet(getCurrentClass(), classExpression));
getOWLOntologyManager().applyChange(new AddAxiom(ontology, ax));
}
@Override
public void handleTagValue(String tag, String value, String qualifierBlock, String comment) {
try {
TagValueHandler handler = handlerMap.get(tag);
if (handler != null) {
handler.handle(currentId, value, qualifierBlock, comment);
}
else if (inHeader) {
if (tag.equals(IMPORT_TAG_NAME)) {
IRI uri = IRI.create(value.trim());
OWLImportsDeclaration decl = owlOntologyManager.getOWLDataFactory().getOWLImportsDeclaration(uri);
owlOntologyManager.makeLoadImportRequest(decl, configuration);
owlOntologyManager.applyChange(new AddImport(ontology, decl));
}
else {
// Ontology annotations
OWLLiteral con = getDataFactory().getOWLLiteral(unescapeTagValue(value));
OWLAnnotationProperty property = getDataFactory().getOWLAnnotationProperty(getIRIFromTagName(tag));
OWLAnnotation anno = getDataFactory().getOWLAnnotation(property, con);
owlOntologyManager.applyChange(new AddOntologyAnnotation(ontology, anno));
}
}
else if (currentId != null) {
// Add as annotation
if (configuration.isLoadAnnotationAxioms()) {
IRI subject = getIRI(currentId);
OWLLiteral con = getDataFactory().getOWLLiteral(unescapeTagValue(value));
IRI annotationPropertyIRI = getIRIFromTagName(tag);
OWLAnnotationProperty property = getDataFactory().getOWLAnnotationProperty(annotationPropertyIRI);
OWLAnnotation anno = getDataFactory().getOWLAnnotation(property, con);
OWLAnnotationAssertionAxiom ax = getDataFactory().getOWLAnnotationAssertionAxiom(subject, anno);
owlOntologyManager.addAxiom(ontology, ax);
OWLDeclarationAxiom annotationPropertyDeclaration = getDataFactory().getOWLDeclarationAxiom(property);
owlOntologyManager.addAxiom(ontology, annotationPropertyDeclaration);
}
}
}
catch (UnloadableImportException e) {
logger.severe(e.getMessage());
}
}
public String unescapeTagValue(String value) {
String unquoted;
if (value.startsWith("\"") && value.endsWith("\"")) {
unquoted = value.substring(1, value.length() - 1);
}
else {
unquoted = value;
}
StringBuilder sb = new StringBuilder();
for (int i = 0; i < unquoted.length(); i++) {
char ch = unquoted.charAt(i);
if (ch != '\\') {
sb.append(ch);
}
}
return sb.toString();
}
private OWLDataFactory getDataFactory() {
return getOWLOntologyManager().getOWLDataFactory();
}
public OWLClass getCurrentClass() {
return getDataFactory().getOWLClass(getIRI(currentId));
}
public OWLEntity getCurrentEntity() {
if (isTerm()) {
return getCurrentClass();
}
else if (isTypedef()) {
// Sometimes, we can have symbolic names e.g. has_part. It's not really clear how to tell the difference
IRI propertyIRI = getRelationIRIFromSymbolicIdOrOBOId(currentId);
return getDataFactory().getOWLObjectProperty(propertyIRI);
}
else {
return getDataFactory().getOWLNamedIndividual(getIRI(currentId));
}
}
/**
* Gets an IRI from a tag name.
* @param tagName The tag name.
* @return The IRI for the tag name. For built in tags this is obtained from the {@link OBOVocabulary} enum.
* Not null
.
* @throws NullPointerException if tagName is null.
*/
public IRI getIRIFromTagName(String tagName) {
if (tagName == null) {
throw new NullPointerException("tagName must not be null");
}
IRI tagIRI = tagIRICache.get(tagName);
if (tagIRI != null) {
return tagIRI;
}
else {
IRI freshTagIRI = IRI.create(OBOVocabulary.OBO_IRI_BASE + tagName);
tagIRICache.put(tagName, freshTagIRI);
return freshTagIRI;
}
}
/**
* Gets an IRI from an OBO ID. The OBO ID may be a canonical OBO ID of the form idspace:sequence or it may be
* a non-canonical ID.
* @param oboId The OBO ID
* @return An IRI obtained from the translation of the OBO ID.
*/
public IRI getIRIFromOBOId(String oboId) {
if (oboId == null) {
throw new NullPointerException("oboId must not be null.");
}
return getIRI(oboId);
}
public IRI getRelationIRIFromSymbolicIdOrOBOId(String symbolicIdOrOBOId) {
IRI fullIRI = symbolicIdCache.get(symbolicIdOrOBOId);
if(fullIRI != null) {
return fullIRI;
}
OBOIdType idType = OBOIdType.getIdType(symbolicIdOrOBOId);
if (idType == null) {
throw new OWLRuntimeException("Invalid ID: " + symbolicIdOrOBOId
+ " in frame " + currentId);
}
else {
return idType.getIRIFromOBOId(ontology.getOntologyID(), idSpaceManager, symbolicIdOrOBOId);
}
}
private IRI getIRI(String s) {
String trimmed = s.trim();
IRI iri = uriCache.get(trimmed);
if (iri != null) {
return iri;
}
OWLOntologyID ontologyID = getOntology().getOntologyID();
OBOIdType type = OBOIdType.getIdType(trimmed);
if (type == null) {
throw new OWLRuntimeException("Not a valid OBO ID: " + s);
}
IRI freshIRI = type.getIRIFromOBOId(ontologyID, idSpaceManager, trimmed);
uriCache.put(trimmed, freshIRI);
return freshIRI;
}
private static final Pattern XREF_PATTERN = Pattern.compile("([^\"]*)\\s*(\"((\\\"|[^\"])*)\")?");
private static final int XREF_ID_GROUP = 1;
private static final int XREF_QUOTED_STRING_GROUP = 3;
public OWLAnnotation parseXRef(String xref) {
Matcher matcher = XREF_PATTERN.matcher(xref);
if (matcher.matches()) {
OWLDataFactory df = getDataFactory();
String xrefQuotedString = matcher.group(XREF_QUOTED_STRING_GROUP);
// the quoted string is a description of the xref. I can't find anywhere to put this.
// Just add as a comment for now
Set xrefDescriptions;
if (xrefQuotedString != null) {
xrefDescriptions = new HashSet();
xrefDescriptions.add(df.getOWLAnnotation(df.getRDFSComment(), df.getOWLLiteral(xrefQuotedString)));
}
else {
xrefDescriptions = Collections.emptySet();
}
String xrefId = matcher.group(XREF_ID_GROUP).trim();
OBOIdType idType = OBOIdType.getIdType(xrefId);
OWLAnnotationValue annotationValue;
if (idType != null) {
annotationValue = getIRIFromOBOId(xrefId);
}
else {
annotationValue = getDataFactory().getOWLLiteral(xrefId);
}
OWLAnnotationProperty xrefProperty = df.getOWLAnnotationProperty(OBOVocabulary.XREF.getIRI());
return df.getOWLAnnotation(xrefProperty, annotationValue, xrefDescriptions);
}
else {
OWLDataFactory df = getDataFactory();
OWLAnnotationProperty xrefProperty = df.getOWLAnnotationProperty(OBOVocabulary.XREF.getIRI());
return df.getOWLAnnotation(xrefProperty, df.getOWLLiteral(xref));
}
}
}
© 2015 - 2024 Weber Informatics LLC | Privacy Policy