All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.xerial.lens.XMLSilkLens Maven / Gradle / Ivy

There is a newer version: 3.4.0
Show newest version
/*--------------------------------------------------------------------------
 *  Copyright 2009 Taro L. Saito
 *
 *  Licensed under the Apache License, Version 2.0 (the "License");
 *  you may not use this file except in compliance with the License.
 *  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 *  Unless required by applicable law or agreed to in writing, software
 *  distributed under the License is distributed on an "AS IS" BASIS,
 *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *  See the License for the specific language governing permissions and
 *  limitations under the License.
 *--------------------------------------------------------------------------*/
//--------------------------------------
// XerialJ
//
// XMLSilkLens.java
// Since: Jul 28, 2009 11:41:27 AM
//
// $URL$
// $Author$
//--------------------------------------
package org.xerial.lens;

import java.io.Reader;
import java.io.StringWriter;
import java.io.Writer;

import org.xerial.core.XerialErrorCode;
import org.xerial.core.XerialException;
import org.xerial.silk.SilkWriter;
import org.xerial.util.ArrayDeque;
import org.xerial.util.xml.XMLAttribute;
import org.xml.sax.Attributes;
import org.xml.sax.InputSource;
import org.xml.sax.SAXException;
import org.xml.sax.XMLReader;
import org.xml.sax.ext.DefaultHandler2;
import org.xml.sax.helpers.XMLReaderFactory;

/**
 * XML to Silk format converter
 * 
 * @author leo
 * 
 */
public class XMLSilkLens {

    private static class XMLToSilkSAXHandler extends DefaultHandler2 {
        private SilkWriter context;

        private static class TagContext {
            public final String tagName;
            public final XMLAttribute attribute;
            public StringBuilder textBuf = new StringBuilder();
            public boolean isOpen = false;

            public TagContext(String tagName, XMLAttribute attribute) {
                this.tagName = tagName;
                this.attribute = attribute;
            }

            @Override
            public String toString() {
                return String.format("%s (%s) : %s", tagName, attribute.toXMLString(), textBuf
                        .toString());
            }
        }

        private ArrayDeque contextStack = new ArrayDeque();
        private ArrayDeque unopendContextStack = new ArrayDeque();

        public XMLToSilkSAXHandler(Writer out) {
            this.context = new SilkWriter(out);
        }

        public void characters(char[] ch, int start, int length) throws SAXException {
            TagContext tc = unopendContextStack.isEmpty() ? contextStack.getLast()
                    : unopendContextStack.getLast();
            tc.textBuf.append(ch, start, length);

        }

        public void endDocument() throws SAXException {
            context.endDocument();
        }

        public void endElement(String uri, String localName, String name) throws SAXException {

            // start node
            openContext();

            context = context.getParent();

            contextStack.removeLast();
        }

        public void processingInstruction(String target, String data) throws SAXException {
            context.commentLine("PI: " + data);
        }

        @Override
        public void comment(char[] ch, int start, int length) throws SAXException {
            context.commentLine(new String(ch, start, length));
        }

        public void startDocument() throws SAXException {
            context.preamble();
        }

        private void openContext() {

            for (TagContext tc : unopendContextStack) {
                // start node
                if (!tc.isOpen) {
                    context = context.node(tc.tagName);
                    for (int i = 0; i < tc.attribute.length(); ++i) {
                        context.attribute(tc.attribute.getName(i), tc.attribute.getValue(i));
                    }
                    if (tc.textBuf.length() > 0) {
                        String value = tc.textBuf.toString().trim();
                        if (value.length() > 0)
                            context.nodeValue(value);
                    }

                    tc.isOpen = true;
                }

                contextStack.addLast(tc);
            }

            unopendContextStack.clear();
        }

        public void startElement(String uri, String localName, String name, Attributes atts)
                throws SAXException {

            openContext();

            XMLAttribute at = new XMLAttribute();
            for (int i = 0; i < atts.getLength(); ++i)
                at.add(atts.getQName(i), atts.getValue(i));

            unopendContextStack.addLast(new TagContext(name, at));
        }

    }

    public static String toSilk(Reader xml) throws XerialException {

        StringWriter buf = new StringWriter();

        try {
            // Set namespaceAware to true to get a parser that corresponds to
            // the default SAX2 namespace feature setting.  This is necessary
            // because the default value from JAXP 1.0 was defined to be false.

            // Validation part 1: set whether validation is on
            //spf.setValidating(dtdValidate || xsdValidate);

            // Create a JAXP SAXParser

            // Get the encapsulated SAX XMLReader
            XMLReader xmlReader = XMLReaderFactory.createXMLReader();

            DefaultHandler2 ch = new XMLToSilkSAXHandler(buf);
            // Set the ContentHandler of the XMLReader
            xmlReader.setContentHandler(ch);
            xmlReader.setProperty("http://xml.org/sax/properties/lexical-handler", ch);

            xmlReader.parse(new InputSource(xml));

        }
        catch (Exception e) {
            throw new XerialException(XerialErrorCode.INVALID_STATE,
                    "failed to instantiate the XML parser: " + e);
        }

        //        XMLTreeWalker treeWalker = new XMLTreeWalker(xml);
        //      treeWalker.walk(new XMLToSilk(buf));

        return buf.toString();
    }

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy