All Downloads are FREE. Search and download functionalities are using the official Maven repository.

gov.nasa.pds.harvest.meta.ex.BundleMetadataExtractor Maven / Gradle / Ivy

package gov.nasa.pds.harvest.meta.ex;

import java.util.ArrayList;
import java.util.List;

import javax.xml.xpath.XPathExpression;
import javax.xml.xpath.XPathFactory;

import org.w3c.dom.Document;
import org.w3c.dom.Node;
import org.w3c.dom.NodeList;

import gov.nasa.pds.harvest.meta.FieldMap;
import gov.nasa.pds.harvest.util.xml.XPathUtils;


/**
 * Extract metadata from a PDS bundle
 * @author karpenko
 */
public class BundleMetadataExtractor
{
    /**
     * Inner class to store bundle member (collection) information.
     * @author karpenko
     */
    public static class BundleMemberEntry
    {
        public String lid;
        public String lidvid;
        public boolean isPrimary = false;
        public String type;
        public String shortType;
        
        public String getLidVidKey()
        {
            String key = "ref_lidvid_" + shortType;
            return isPrimary ? key : key + "_secondary";
        }
        
        public String getLidKey()
        {
            String key = "ref_lid_" + shortType;
            return isPrimary ? key : key + "_secondary";
        }
    }
    
    
    private XPathExpression xBme;
    

    /**
     * Constructor
     * @throws Exception an exception
     */
    public BundleMetadataExtractor() throws Exception
    {
        XPathFactory xpf = XPathFactory.newInstance();
        xBme = XPathUtils.compileXPath(xpf, "/Product_Bundle/Bundle_Member_Entry");
    }
    
    
    /**
     * Extract bundle members (collections)
     * @param doc Parsed PDS label (XML DOM)
     * @return list of bundle members (collections)
     * @throws Exception an exception
     */
    public List extractBundleMemberEntries(Document doc) throws Exception
    {
        List list = new ArrayList();
        
        NodeList nodes = XPathUtils.getNodeList(doc, xBme);        
        if(nodes == null || nodes.getLength() == 0) return list;

        for(int i = 0; i < nodes.getLength(); i++)
        {
            BundleMemberEntry bme = createBme(nodes.item(i));
            list.add(bme);
        }
        
        return list;
    }


    /**
     * Add a collection reference (LID and LIDVID) from bundle member entry to the field map.
     * @param fmap keeps list of collection references
     * @param bme bundle member entry
     */
    public void addRefs(FieldMap fmap, BundleMemberEntry bme)
    {
        if(bme.lidvid != null)
        {
            fmap.addValue(bme.getLidVidKey(), bme.lidvid);
        }
        
        if(bme.lid != null)
        {
            fmap.addValue(bme.getLidKey(), bme.lid);
        }
        
        // Convert lidvid to lid only if lid is not available
        if(bme.lidvid != null && bme.lid == null)
        {
            int idx = bme.lidvid.indexOf("::");
            if(idx > 0)
            {
                String lid = bme.lidvid.substring(0, idx);
                fmap.addValue(bme.getLidKey(), lid);
            }
        }
    }

    
    private BundleMemberEntry createBme(Node root)
    {
        BundleMemberEntry bme = new BundleMemberEntry();
    
        NodeList nodes = root.getChildNodes();
        
        for(int i = 0; i < nodes.getLength(); i++)
        {
            Node node = nodes.item(i);
            String nodeName = node.getNodeName();
            
            if(nodeName.equals("lid_reference"))
            {
                bme.lid = node.getTextContent().trim();
            }
            else if(nodeName.equals("lidvid_reference"))
            {
                bme.lidvid = node.getTextContent().trim();
            }
            else if(nodeName.equals("reference_type"))
            {
                bme.type = node.getTextContent().trim();
                String[] tokens = bme.type.split("_");
                bme.shortType = tokens[tokens.length-1];
            }
            else if(nodeName.equals("member_status"))
            {
                String status = node.getTextContent().trim();
                bme.isPrimary = "Primary".equalsIgnoreCase(status); 
            }
        }
        
        if(bme.shortType == null) bme.shortType = "collection"; 

        return bme;
    }

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy