org.jgrapht.nio.graphml.GraphMLEventDrivenImporter Maven / Gradle / Ivy
/*
* (C) Copyright 2016-2023, by Dimitrios Michail and Contributors.
*
* JGraphT : a free Java graph-theory library
*
* See the CONTRIBUTORS.md file distributed with this work for additional
* information regarding copyright ownership.
*
* This program and the accompanying materials are made available under the
* terms of the Eclipse Public License 2.0 which is available at
* http://www.eclipse.org/legal/epl-2.0, or the
* GNU Lesser General Public License v2.1 or later
* which is available at
* http://www.gnu.org/licenses/old-licenses/lgpl-2.1-standalone.html.
*
* SPDX-License-Identifier: EPL-2.0 OR LGPL-2.1-or-later
*/
package org.jgrapht.nio.graphml;
import org.jgrapht.*;
import org.jgrapht.alg.util.*;
import org.jgrapht.nio.*;
import org.xml.sax.*;
import org.xml.sax.helpers.*;
import javax.xml.*;
import javax.xml.parsers.*;
import javax.xml.transform.*;
import javax.xml.transform.stream.*;
import javax.xml.validation.*;
import java.io.*;
import java.util.*;
import java.util.Map.*;
/**
* Imports a graph from a GraphML data source.
*
*
* For a description of the format see
* http://en.wikipedia.org/wiki/ GraphML or the
* GraphML Primer.
*
*
*
* Below is small example of a graph in GraphML format.
*
*
* {@code
*
*
*
* yellow
*
*
*
*
* green
*
*
*
* blue
*
*
* red
*
*
*
* turquoise
*
*
* 1.0
*
*
* 1.0
*
*
* 2.0
*
*
*
*
*
* 1.1
*
*
*
* }
*
*
*
* In case the corresponding edge key with attr.name="weight" is defined, the importer also reads
* edge weights. Otherwise edge weights are ignored.
*
*
* GraphML-Attributes Values are read as string key-value pairs and passed using vertex and edge
* attribute consumers.
*
*
* The importer by default validates the input using the 1.0
* GraphML Schema. The user can
* (not recommended) disable the validation by calling {@link #setSchemaValidation(boolean)}.
*
* @author Dimitrios Michail
*/
public class GraphMLEventDrivenImporter
extends BaseEventDrivenImporter>
implements EventDrivenImporter>
{
private static final String GRAPHML_SCHEMA_FILENAME = "graphml.xsd";
private static final String XLINK_SCHEMA_FILENAME = "xlink.xsd";
// special attributes
private static final String EDGE_WEIGHT_DEFAULT_ATTRIBUTE_NAME = "weight";
private String edgeWeightAttributeName = EDGE_WEIGHT_DEFAULT_ATTRIBUTE_NAME;
private boolean schemaValidation;
/**
* Constructs a new importer.
*/
public GraphMLEventDrivenImporter()
{
this.schemaValidation = true;
}
/**
* Get the attribute name for edge weights
*
* @return the attribute name
*/
public String getEdgeWeightAttributeName()
{
return edgeWeightAttributeName;
}
/**
* Set the attribute name to use for edge weights.
*
* @param edgeWeightAttributeName the attribute name
*/
public void setEdgeWeightAttributeName(String edgeWeightAttributeName)
{
if (edgeWeightAttributeName == null) {
throw new IllegalArgumentException("Edge weight attribute name cannot be null");
}
this.edgeWeightAttributeName = edgeWeightAttributeName;
}
/**
* Whether the importer validates the input
*
* @return true if the importer validates the input
*/
public boolean isSchemaValidation()
{
return schemaValidation;
}
/**
* Set whether the importer should validate the input
*
* @param schemaValidation value for schema validation
*/
public void setSchemaValidation(boolean schemaValidation)
{
this.schemaValidation = schemaValidation;
}
@Override
public void importInput(Reader input)
{
try {
// parse
XMLReader xmlReader = createXMLReader();
GraphMLHandler handler = new GraphMLHandler();
xmlReader.setContentHandler(handler);
xmlReader.setErrorHandler(handler);
notifyImportEvent(ImportEvent.START);
xmlReader.parse(new InputSource(input));
handler.notifyInterestedParties();
notifyImportEvent(ImportEvent.END);
} catch (Exception e) {
throw new ImportException("Failed to parse GraphML", e);
}
}
private XMLReader createXMLReader()
throws ImportException
{
try {
SchemaFactory schemaFactory =
SchemaFactory.newInstance(XMLConstants.W3C_XML_SCHEMA_NS_URI);
// create parser
SAXParserFactory spf = SAXParserFactory.newInstance();
if (schemaValidation) {
// load schema
InputStream xsdStream =
Thread.currentThread().getContextClassLoader().getResourceAsStream(
GRAPHML_SCHEMA_FILENAME);
if (xsdStream == null) {
throw new ImportException("Failed to locate GraphML xsd");
}
InputStream xlinkStream =
Thread.currentThread().getContextClassLoader().getResourceAsStream(
XLINK_SCHEMA_FILENAME);
if (xlinkStream == null) {
throw new ImportException("Failed to locate XLink xsd");
}
Source[] sources = new Source[2];
sources[0] = new StreamSource(xlinkStream);
sources[1] = new StreamSource(xsdStream);
Schema schema = schemaFactory.newSchema(sources);
spf.setSchema(schema);
}
spf.setNamespaceAware(true);
SAXParser saxParser = spf.newSAXParser();
// create reader
return saxParser.getXMLReader();
} catch (Exception e) {
throw new ImportException("Failed to parse GraphML", e);
}
}
// content handler
private class GraphMLHandler
extends DefaultHandler
{
private static final String GRAPH = "graph";
private static final String GRAPH_ID = "id";
private static final String NODE = "node";
private static final String NODE_ID = "id";
private static final String EDGE = "edge";
private static final String ALL = "all";
private static final String EDGE_SOURCE = "source";
private static final String EDGE_TARGET = "target";
private static final String KEY = "key";
private static final String KEY_FOR = "for";
private static final String KEY_ATTR_NAME = "attr.name";
private static final String KEY_ATTR_TYPE = "attr.type";
private static final String KEY_ID = "id";
private static final String DEFAULT = "default";
private static final String DATA = "data";
private static final String DATA_KEY = "key";
// collect graph elements here
private Map nodes;
private List edges;
// record state of parser
private boolean insideDefault;
private boolean insideData;
// temporary state while reading elements
// stack needed due to nested graphs in GraphML
private Data currentData;
private Key currentKey;
private Deque currentGraphElement;
// collect custom keys
private Map nodeValidKeys;
private Map edgeValidKeys;
// notify interested parties
public void notifyInterestedParties()
throws ImportException
{
if (nodes.isEmpty()) {
return;
}
// nodes
Set graphNodes = new HashSet<>();
for (Entry en : nodes.entrySet()) {
String nodeId = en.getKey();
if (nodeId == null) {
throw new ImportException("Node id missing");
}
// create attributes
Map collectedAttributes = en.getValue().attributes;
Map finalAttributes = new LinkedHashMap<>();
for (Key validKey : nodeValidKeys.values()) {
String validId = validKey.id;
AttributeType validType = validKey.type;
if (collectedAttributes.containsKey(validId)) {
finalAttributes.put(
validKey.attributeName,
new DefaultAttribute<>(collectedAttributes.get(validId), validType));
} else if (validKey.defaultValue != null) {
finalAttributes.put(
validKey.attributeName,
new DefaultAttribute<>(validKey.defaultValue, validType));
}
}
notifyVertex(nodeId);
for (String key : finalAttributes.keySet()) {
notifyVertexAttribute(nodeId, key, finalAttributes.get(key));
}
graphNodes.add(nodeId);
}
// check how to handle special edge weight
boolean handleSpecialEdgeWeights = false;
double defaultSpecialEdgeWeight = Graph.DEFAULT_EDGE_WEIGHT;
for (Key k : edgeValidKeys.values()) {
if (k.attributeName.equals(edgeWeightAttributeName)) {
handleSpecialEdgeWeights = true;
String defaultValue = k.defaultValue;
try {
if (defaultValue != null) {
defaultSpecialEdgeWeight = Double.parseDouble(defaultValue);
}
} catch (NumberFormatException e) {
// ignore
}
// first key only which maps to special edge "weight"
break;
}
}
// create edges
for (GraphElement p : edges) {
if (p.id1 == null) {
throw new ImportException("Edge source vertex missing");
}
if (!graphNodes.contains(p.id1)) {
throw new ImportException("Source vertex " + p.id1 + " not found");
}
if (p.id2 == null) {
throw new ImportException("Edge target vertex missing");
}
if (!graphNodes.contains(p.id2)) {
throw new ImportException("Target vertex " + p.id2 + " not found");
}
// create attributes
Map collectedAttributes = p.attributes;
Map finalAttributes = new LinkedHashMap<>();
for (Key validKey : edgeValidKeys.values()) {
String validId = validKey.id;
AttributeType validType = validKey.type;
if (collectedAttributes.containsKey(validId)) {
finalAttributes.put(
validKey.attributeName,
new DefaultAttribute<>(collectedAttributes.get(validId), validType));
} else {
if (validKey.defaultValue != null) {
finalAttributes.put(
validKey.attributeName,
new DefaultAttribute<>(validKey.defaultValue, validType));
}
}
}
Triple te = Triple.of(p.id1, p.id2, null);
// special handling for weighted graphs
if (handleSpecialEdgeWeights) {
if (finalAttributes.containsKey(edgeWeightAttributeName)) {
try {
te.setThird(
Double.parseDouble(
finalAttributes.get(edgeWeightAttributeName).getValue()));
} catch (NumberFormatException nfe) {
te.setThird(defaultSpecialEdgeWeight);
}
}
}
notifyEdge(te);
for (String key : finalAttributes.keySet()) {
notifyEdgeAttribute(te, key, finalAttributes.get(key));
}
}
}
@Override
public void startDocument()
throws SAXException
{
nodes = new LinkedHashMap<>();
edges = new ArrayList<>();
nodeValidKeys = new LinkedHashMap<>();
edgeValidKeys = new LinkedHashMap<>();
insideDefault = false;
insideData = false;
currentKey = null;
currentData = null;
currentGraphElement = new ArrayDeque<>();
currentGraphElement.push(new GraphElement("graphml"));
}
@Override
public void startElement(String uri, String localName, String qName, Attributes attributes)
throws SAXException
{
switch (localName) {
case GRAPH:
currentGraphElement.push(new GraphElement(findAttribute(GRAPH_ID, attributes)));
break;
case NODE:
currentGraphElement.push(new GraphElement(findAttribute(NODE_ID, attributes)));
break;
case EDGE:
currentGraphElement.push(
new GraphElement(
findAttribute(EDGE_SOURCE, attributes),
findAttribute(EDGE_TARGET, attributes)));
break;
case KEY:
String keyId = findAttribute(KEY_ID, attributes);
String keyFor = findAttribute(KEY_FOR, attributes);
String keyAttrName = findAttribute(KEY_ATTR_NAME, attributes);
String keyAttrType = findAttribute(KEY_ATTR_TYPE, attributes);
currentKey = new Key(keyId, keyAttrName, null, null);
if (keyAttrType != null) {
currentKey.type = AttributeType.create(keyAttrType);
}
if (keyFor != null) {
switch (keyFor) {
case EDGE:
currentKey.target = KeyTarget.EDGE;
break;
case NODE:
currentKey.target = KeyTarget.NODE;
break;
case ALL:
currentKey.target = KeyTarget.ALL;
break;
}
}
break;
case DEFAULT:
insideDefault = true;
break;
case DATA:
insideData = true;
currentData = new Data(findAttribute(DATA_KEY, attributes), null);
break;
default:
break;
}
}
@Override
public void endElement(String uri, String localName, String qName)
throws SAXException
{
switch (localName) {
case GRAPH:
currentGraphElement.pop();
break;
case NODE:
GraphElement currentNode = currentGraphElement.pop();
if (nodes.containsKey(currentNode.id1)) {
throw new SAXException("Node with id " + currentNode.id1 + " already exists");
}
nodes.put(currentNode.id1, currentNode);
break;
case EDGE:
GraphElement currentEdge = currentGraphElement.pop();
edges.add(currentEdge);
break;
case KEY:
if (currentKey.isValid()) {
switch (currentKey.target) {
case NODE:
nodeValidKeys.put(currentKey.id, currentKey);
break;
case EDGE:
edgeValidKeys.put(currentKey.id, currentKey);
break;
case ALL:
nodeValidKeys.put(currentKey.id, currentKey);
edgeValidKeys.put(currentKey.id, currentKey);
break;
}
}
currentKey = null;
break;
case DEFAULT:
insideDefault = false;
break;
case DATA:
if (currentData.isValid()) {
currentGraphElement.peek().attributes.put(currentData.key, currentData.value);
}
insideData = false;
currentData = null;
break;
default:
break;
}
}
@Override
public void characters(char ch[], int start, int length)
throws SAXException
{
if (insideDefault) {
if (currentKey.defaultValue != null) {
currentKey.defaultValue += new String(ch, start, length);
} else {
currentKey.defaultValue = new String(ch, start, length);
}
} else if (insideData) {
if (currentData.value != null) {
currentData.value += new String(ch, start, length);
} else {
currentData.value = new String(ch, start, length);
}
}
}
@Override
public void warning(SAXParseException e)
throws SAXException
{
throw e;
}
public void error(SAXParseException e)
throws SAXException
{
throw e;
}
public void fatalError(SAXParseException e)
throws SAXException
{
throw e;
}
private String findAttribute(String localName, Attributes attributes)
{
for (int i = 0; i < attributes.getLength(); i++) {
String attrLocalName = attributes.getLocalName(i);
if (attrLocalName.equals(localName)) {
return attributes.getValue(i);
}
}
return null;
}
}
// ----- Helper classes for storing partial parser results -----
private enum KeyTarget
{
NODE,
EDGE,
ALL
}
private class Key
{
String id;
String attributeName;
String defaultValue;
KeyTarget target;
AttributeType type;
public Key(String id, String attributeName, String defaultValue, KeyTarget target)
{
this.id = id;
this.attributeName = attributeName;
this.defaultValue = defaultValue;
this.target = target;
this.type = AttributeType.STRING;
}
public boolean isValid()
{
return id != null && attributeName != null && target != null;
}
}
private class Data
{
String key;
String value;
public Data(String key, String value)
{
this.key = key;
this.value = value;
}
public boolean isValid()
{
return key != null && value != null;
}
}
private class GraphElement
{
String id1;
String id2;
Map attributes;
public GraphElement(String id1)
{
this.id1 = id1;
this.id2 = null;
this.attributes = new LinkedHashMap();
}
public GraphElement(String id1, String id2)
{
this.id1 = id1;
this.id2 = id2;
this.attributes = new LinkedHashMap();
}
}
}