All downloads are free. The search and download features use the official Maven repository.

gr.ekt.bteio.loaders.XMLDirectoryDataLoader Maven / Gradle / Ivy

/**
 * Copyright (c) 2007-2013, National Documentation Centre (EKT, www.ekt.gr)
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met:
 *
 *     Redistributions of source code must retain the above copyright
 *     notice, this list of conditions and the following disclaimer.
 *
 *     Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in
 *     the documentation and/or other materials provided with the
 *     distribution.
 *
 *     Neither the name of the National Documentation Centre nor the
 *     names of its contributors may be used to endorse or promote
 *     products derived from this software without specific prior written
 *     permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
package gr.ekt.bteio.loaders;

import java.io.FilenameFilter;
import java.io.File;
import java.io.IOException;
import java.util.Map;
import javax.xml.parsers.DocumentBuilderFactory;
import javax.xml.parsers.DocumentBuilder;
import javax.xml.parsers.ParserConfigurationException;
import javax.xml.xpath.XPathExpressionException;

import org.apache.log4j.Logger;

import org.w3c.dom.Document;
import org.xml.sax.SAXException;

import gr.ekt.bte.core.RecordSet;
import gr.ekt.bte.core.DataLoadingSpec;
import gr.ekt.bte.record.XPathRecord;
import gr.ekt.bte.dataloader.FileDataLoader;

/**
 * Data loader that reads the {@code *.xml} files found directly inside a
 * directory and wraps each successfully parsed document in an
 * {@link XPathRecord}.
 *
 * <p>The directory path is the {@code filename} handed to the constructor
 * (it is passed on to {@link FileDataLoader}); the XPath map is passed
 * unchanged to every {@code XPathRecord} that is created.</p>
 *
 * <p>NOTE(review): the XML parser is created with default settings apart
 * from namespace awareness. If the directory may contain untrusted XML,
 * consider disabling DTDs / external entities on the factory.</p>
 */
public class XMLDirectoryDataLoader extends FileDataLoader {
    /** Map handed as-is to each {@link XPathRecord}; kept raw to match existing callers. */
    private final Map xpath_string_map;
    private static final Logger logger = Logger.getLogger(XMLDirectoryDataLoader.class);

    /**
     * Creates a loader for the given directory.
     *
     * @param filename path of the directory that holds the XML files
     * @param xpath_string_map map passed to the {@link XPathRecord} built for each file
     */
    public XMLDirectoryDataLoader(String filename, Map xpath_string_map) {
        super(filename);
        this.xpath_string_map = xpath_string_map;
    }

    /** Accepts entries whose name ends with {@code .xml} (case-sensitive). */
    class XmlFilter implements FilenameFilter {
        @Override
        public boolean accept(File dir, String name) {
            return name.endsWith(".xml");
        }
    }

    /**
     * Parses every {@code *.xml} file in the configured directory and
     * collects one record per file.
     *
     * <p>A file that cannot be read, parsed or turned into a record is
     * logged and skipped; the remaining files are still processed.</p>
     *
     * @return the records that were loaded (possibly none), or
     *         {@code null} when the configured path is not a directory,
     *         the directory cannot be listed, or the XML parser cannot be
     *         created
     */
    @Override
    public RecordSet getRecords() {
        File data_dir = new File(filename);
        if (!data_dir.isDirectory()) {
            logger.warn("Not a directory: " + data_dir);
            return null;
        }

        // listFiles() returns null (it does not throw) on an I/O error or
        // when the directory vanished after the isDirectory() check.
        File xmls[] = data_dir.listFiles(new XmlFilter());
        if (xmls == null) {
            logger.error("Could not list the contents of directory " + data_dir);
            return null;
        }

        //TODO factor out the actual reading in order for it to be available for use from getRecords(DataLoadingSpec)
        DocumentBuilderFactory doc_factory = DocumentBuilderFactory.newInstance();
        doc_factory.setNamespaceAware(true);

        DocumentBuilder doc_builder;
        try {
            doc_builder = doc_factory.newDocumentBuilder();
        } catch(ParserConfigurationException e) {
            //TODO throw MalformedSourceException
            logger.error("Could not create an XML parser", e);
            return null;
        }

        RecordSet ret = new RecordSet();
        for (File fl : xmls) {
            // Pass the exception itself to the logger so that its type,
            // message and stack trace actually reach the log.
            try {
                Document doc = doc_builder.parse(fl);
                XPathRecord rec = new XPathRecord(doc, xpath_string_map);
                ret.addRecord(rec);
            } catch(SAXException e) {
                logger.warn("Skipping " + fl + ": not well-formed XML", e);
            } catch(IOException e) {
                logger.warn("Skipping " + fl + ": could not be read", e);
            } catch(XPathExpressionException e) {
                logger.warn("Skipping " + fl + ": XPath expression could not be evaluated", e);
            }
        }

        return ret;
    }

    /**
     * Currently ignores {@code spec} and behaves exactly like
     * {@link #getRecords()}.
     *
     * @param spec loading specification (unused for now)
     * @return the result of {@link #getRecords()}
     */
    @Override
    public RecordSet getRecords(DataLoadingSpec spec) {
        //TODO implement when DataLoadingSpec gets defined.
        return getRecords();
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy