org.projecthusky.communication.xd.xdm.XdmContents Maven / Gradle / Ivy
The newest version!
/*
* This code is made available under the terms of the Eclipse Public License v1.0
* in the github project https://github.com/project-husky/husky there you also
* find a list of the contributors and the license information.
*
* This project has been developed further and modified by the joined working group Husky
* on the basis of the eHealth Connector opensource project from June 28, 2021,
* whereas medshare GmbH is the initial and main contributor/author of the eHealth Connector.
*
*/
package org.projecthusky.communication.xd.xdm;
import java.io.BufferedInputStream;
import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.io.StringWriter;
import java.util.ArrayList;
import java.util.Enumeration;
import java.util.HashMap;
import java.util.LinkedList;
import java.util.List;
import java.util.Map;
import java.util.zip.ZipEntry;
import java.util.zip.ZipFile;
import jakarta.activation.DataHandler;
import jakarta.mail.util.ByteArrayDataSource;
import jakarta.xml.bind.JAXBContext;
import jakarta.xml.bind.JAXBException;
import jakarta.xml.bind.Marshaller;
import org.apache.commons.codec.digest.DigestUtils;
import org.apache.commons.io.IOUtils;
import org.projecthusky.common.utils.ZipCreator;
import org.projecthusky.communication.utils.XdsUtil;
import org.openehealth.ipf.commons.ihe.xds.core.metadata.Association;
import org.openehealth.ipf.commons.ihe.xds.core.metadata.Document;
import org.openehealth.ipf.commons.ihe.xds.core.metadata.DocumentEntry;
import org.openehealth.ipf.commons.ihe.xds.core.metadata.Folder;
import org.openehealth.ipf.commons.ihe.xds.core.requests.ProvideAndRegisterDocumentSet;
import org.openehealth.ipf.commons.ihe.xds.core.responses.ErrorCode;
import org.openehealth.ipf.commons.ihe.xds.core.responses.ErrorInfo;
import org.openehealth.ipf.commons.ihe.xds.core.responses.Severity;
import org.openehealth.ipf.commons.ihe.xds.core.responses.Status;
import org.openehealth.ipf.commons.ihe.xds.core.stub.ebrs30.lcm.SubmitObjectsRequest;
import org.openehealth.ipf.platform.camel.ihe.xds.core.converters.EbXML30Converters;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
* The Class XdmContents represents all content of an XDM volume. This includes
* human readable informative files like README.TXT or INDEX.HTM and also
* machine readable files like METADATA.XML
*/
public class XdmContents {
/** The xdm index. */
private static final String XDM_INDEX = "INDEX.HTM";
/** The xdm metadata. */
private static final String XDM_METADATA = "METADATA.XML";
/** The xdm payload root. */
private static final String XDM_PAYLOAD_ROOT = "IHE_XDM";
/** The xdm readme. */
private static final String XDM_README = "README.TXT";
/** The index htm. */
private IndexHtm indexHtm;
/** The SLF4J logger instance. */
private final Logger log = LoggerFactory.getLogger(getClass());
/** The readme txt. */
private ReadmeTxt readmeTxt;
/** The response object. */
private final XdmRetrieveResponseTypeImpl resp;
/** The txn data. */
private List txnData;
/** The zip file. */
private ZipFile zipFile;
/**
* Instantiates a new xdm contents.
*/
public XdmContents() {
this.resp = new XdmRetrieveResponseTypeImpl();
this.txnData = new LinkedList<>();
}
/**
* Instantiates a new xdm contents with given INDEX.HTM and README.TXT files as
* according objects
*
* @param indexHtm the IndexHtm object (contains information about the contents
* of the volume)
* @param readmeTxt the ReadmeTxt object (contains information about the vendor
* and system that created the volume)
*/
public XdmContents(IndexHtm indexHtm, ReadmeTxt readmeTxt) {
this();
this.indexHtm = indexHtm;
this.readmeTxt = readmeTxt;
}
/**
* Instantiates a new xdm contents with a given filePath, pointing to an
* existing zip file.
*
* @param filePath the file path to an existing zip file, which holds the
* contents of an xdm volume
*/
public XdmContents(String filePath) {
this();
try {
this.zipFile = new ZipFile(filePath);
} catch (final IOException e) {
this.resp.setStatus(Status.FAILURE);
log.error("IO Exception during read of " + filePath, e);
}
}
/**
* Instantiates a new xdm contents with given INDEX.HTM and README.TXT files,
* which will be read from given files paths.
*
* @param indexHtm the IndexHtm object (contains information about the contents
* of the volume)
* @param readmeTxt the ReadmeTxt object (contains information about the vendor
* and system that created the volume)
*/
public XdmContents(String indexHtm, String readmeTxt) {
this();
try (FileInputStream isIndexHtm = new FileInputStream(indexHtm)) {
this.indexHtm = new IndexHtm(isIndexHtm);
} catch (final IOException e) {
this.resp.setStatus(Status.FAILURE);
log.error("IO Exception during reading of INDEX.HTM. ", e);
}
try (FileInputStream isReadme = new FileInputStream(readmeTxt)) {
this.readmeTxt = new ReadmeTxt(isReadme);
} catch (final IOException e) {
this.resp.setStatus(Status.FAILURE);
log.error("IO Exception during reading of README.TXT. ", e);
}
}
/**
* Instantiates a new xdm contents with a given XDM volume as single zip file.
*
* @param zipFile the zip file
*/
public XdmContents(ZipFile zipFile) {
this();
try {
if (zipFile == null)
throw new IOException();
else {
this.zipFile = zipFile;
}
} catch (final IOException e) {
this.resp.setStatus(Status.FAILURE);
log.error("IO Exception during read of ZipFile", e);
}
}
/**
* Creates the metadata xml.
*
* @param txnData the txn data
* @return the XML resource
* @throws JAXBException
*/
private String createMetadataXml(ProvideAndRegisterDocumentSet txnData) throws JAXBException {
SubmitObjectsRequest submit = null;
DocumentEntry docEntry;
String hash;
Long size;
// Calculate Hash and Size for each document and set the information to
// the DocumentMetadata
for (final Document xdsDoc : txnData.getDocuments()) {
try (var is = xdsDoc.getDataHandler().getInputStream()) {
docEntry = xdsDoc.getDocumentEntry();
hash = DigestUtils.sha512Hex(xdsDoc.getDataHandler().getInputStream());
docEntry.setHash(hash);
size = Long.valueOf(IOUtils.toByteArray(is).length);
docEntry.setSize(size);
} catch (final Exception e) {
log.error("Error calculating hash and size. ", e);
return null;
}
}
// form the ebXML payload for the message
submit = EbXML30Converters.convert(txnData).getSubmitObjectsRequest();
final var marshaller = JAXBContext.newInstance(SubmitObjectsRequest.class).createMarshaller();
marshaller.setProperty(Marshaller.JAXB_FORMATTED_OUTPUT, Boolean.FALSE);
marshaller.setProperty(Marshaller.JAXB_FRAGMENT, Boolean.TRUE);
marshaller.setProperty(Marshaller.JAXB_ENCODING, "UTF8");
final var stringWriter = new StringWriter();
marshaller.marshal(submit, stringWriter);
return stringWriter.toString();
}
/**
* Creates the XDM volume contents and writes them to the given outputStream.
*
* @param outputStream the output stream, in which the contents will be written.
* @param txnData the SubmitTransactionData data (containing Metadata and
* the payload files themselves)
*/
public void createZip(OutputStream outputStream, ProvideAndRegisterDocumentSet txnData) {
this.txnData.add(txnData);
// Creating the ZipFileHelper Class
final var zip = new ZipCreator(outputStream);
// Add the path structure for documents in the Zip File
try {
zip.addZipItem("IHE_XDM/");
zip.addZipItem("IHE_XDM/SUBSET01/");
// Add each XdsDocument to the Zip File
var i = 0;
final List docList = txnData.getDocuments();
for (final Document xdsDoc : docList) {
i++;
final String filePath = XdsUtil.createXdmDocPathAndName(xdsDoc, i);
xdsDoc.getDocumentEntry().setUri(XdsUtil.createXdmDocName(xdsDoc, i));
// add the document
zip.addZipItem(xdsDoc.getDataHandler().getInputStream(), filePath);
}
// Add the necessary files to the zip container
zip.addZipItem(indexHtm.getInputStream(), XDM_INDEX);
zip.addZipItem(readmeTxt.getInputStream(), XDM_README);
final String metadataXml = createMetadataXml(txnData);
zip.addZipItem(this.getMetadataXmlInputStream(metadataXml), "IHE_XDM/SUBSET01/METADATA.XML");
zip.closeZip();
} catch (final IOException | JAXBException e) {
this.resp.setStatus(Status.FAILURE);
log.error("IO Exception during zip creation. ", e);
}
}
/**
* Creates the XDM volume contents and writes them to the given File(path)
*
* @param filePath the path to the file, in which the contents will be written.
* @param txnData the SubmitTransactionData data (containing Metadata and the
* payload files themselves)
*/
public void createZip(String filePath, ProvideAndRegisterDocumentSet txnData) {
final var targetFile = new File(filePath);
try (var outputStream = new FileOutputStream(targetFile)) {
createZip(outputStream, txnData);
} catch (final IOException e) {
this.resp.setStatus(Status.FAILURE);
log.error("FileNotFoundException during target file creation. ", e);
}
}
/**
* Checks if the integritiy values (hash and size) for the documents are the
* same as in the metadata.
*
* @return false, if the values don´t match, true otherwise
*/
private boolean documentsIntegrityCheck() {
if (isSubmitTransactionDataNull(0))
return false;
DocumentEntry docMetadata = null;
String docHash = null;
long docSize = 0;
boolean integrityCheck = true;
for (var i = 0; i < txnData.size(); i++) {
for (final Document doc : txnData.get(i).getDocuments()) {
docMetadata = doc.getDocumentEntry();
try (var is = doc.getDataHandler().getInputStream()) {
docHash = DigestUtils.sha512Hex(is);
docSize = IOUtils.toByteArray(is).length;
} catch (final IOException e) {
log.error("IO Exception during zip document integrity check. ", e);
}
if ((docMetadata.getHash() == null) || !docMetadata.getHash().equals(docHash)) {
integrityCheck = checkHash(docMetadata, docHash, i);
}
if (docMetadata.getSize() == null || docMetadata.getSize() != docSize) {
integrityCheck = checkSize(docMetadata, docSize, i);
}
}
}
return integrityCheck;
}
private boolean checkHash(DocumentEntry docMetadata, String docHash, int index) {
if ((docMetadata.getHash() == null) || !docMetadata.getHash().equals(docHash)) {
log.warn("Integrity check failed for document hash in Submission Set: {} DocumentEntry with UUID: {}",
index, docMetadata.getEntryUuid());
this.resp.setStatus(Status.PARTIAL_SUCCESS);
final var error = new ErrorInfo();
error.setErrorCode(ErrorCode.NON_IDENTICAL_HASH);
error.setLocation(
"Document in submission set: " + index + " with Entry UUID: " + docMetadata.getEntryUuid());
error.setCustomErrorCode(
"The hash value of the document does not match the hash value, which is provided in the document metadata.");
error.setSeverity(Severity.WARNING);
if (this.resp.getErrorList() == null) {
this.resp.setErrorList(new LinkedList<>());
}
this.resp.getErrorList().add(error);
return false;
}
return true;
}
private boolean checkSize(DocumentEntry docMetadata, long docSize, int index) {
if (docMetadata.getSize() == null || docMetadata.getSize() != docSize) {
log.warn("Integrity check failed for document size in Submission Set: {} DocumentEntry with UUID: {}",
index, docMetadata.getEntryUuid());
this.resp.setStatus(Status.PARTIAL_SUCCESS);
final var error = new ErrorInfo();
error.setErrorCode(ErrorCode.NON_IDENTICAL_SIZE);
error.setLocation(
"Document in submission set: " + index + " with Entry UUID: " + docMetadata.getEntryUuid());
error.setCustomErrorCode(
"The size value of the document does not match the size value, which is provided in the document metadata.");
error.setSeverity(Severity.WARNING);
if (this.resp.getErrorList() == null) {
this.resp.setErrorList(new LinkedList<>());
}
this.resp.getErrorList().add(error);
return false;
}
return true;
}
/**
* Gets a list containing the documents together with the Document Metadata.
*
* @return the document and metadata list
*/
public List getDocumentAndMetadataList() {
return getDocumentAndMetadataList(0);
}
/**
* Gets a list containing the documents together with the Document Metadata for
* a specific submission set.
*
* @param submissionSetNumber the submission set number
* @return the document and metadata list
*/
public List getDocumentAndMetadataList(int submissionSetNumber) {
lazyLoadCheck();
if (isSubmitTransactionDataNull(submissionSetNumber)) {
return new LinkedList<>();
}
final ProvideAndRegisterDocumentSet std = txnData.get(submissionSetNumber);
final List docAndMetaList = new ArrayList<>();
for (final Document xdsDoc : std.getDocuments()) {
final var docAndMetadataEntry = new DocumentContentAndMetadata(xdsDoc, xdsDoc.getDocumentEntry());
docAndMetaList.add(docAndMetadataEntry);
}
return docAndMetaList;
}
/**
* Gets a list of documents (the actual payload of the XDM volume)
*
* @return the documents
*/
public List getDocumentList() {
return getDocumentList(0);
}
/**
* Gets a list of documents (the actual payload of the XDM volume) for a
* specific submission set.
*
* @param submissionSetNumber the submission set number
* @return the document list
*/
public List getDocumentList(int submissionSetNumber) {
lazyLoadCheck();
if (isSubmitTransactionDataNull(submissionSetNumber)) {
return new LinkedList<>();
}
return txnData.get(submissionSetNumber).getDocuments();
}
/**
* Gets the index htm.
*
* @return the index htm
*/
public IndexHtm getIndexHtm() {
lazyLoadCheck();
return indexHtm;
}
/**
* Gets the metadata xml input stream.
*
* @param metadataXml
*
* @return the metadata xml input stream
*/
private InputStream getMetadataXmlInputStream(String metadataXml) {
try {
final var bOS = new ByteArrayOutputStream();
bOS.write(metadataXml.getBytes());
return new ByteArrayInputStream(bOS.toByteArray());
} catch (final IOException e) {
log.error("IOException during reading the Metadata.xml InputStream ", e);
this.resp.setStatus(Status.FAILURE);
}
return null;
}
/**
* Gets the readme txt.
*
* @return the readme txt
*/
public ReadmeTxt getReadmeTxt() {
lazyLoadCheck();
return readmeTxt;
}
/**
* Given a full ZipEntry filespec, extracts the name of the folder (if present)
* under the IHE_XDM root specified by IHE XDM.
*
* @param zipEntryName the zip entry name
* @return the submission set dirspec
*/
private String getSubmissionSetDirspec(String zipEntryName) {
String result = null;
if (zipEntryName != null) {
final String[] components = zipEntryName.split("[\\\\/]");
if (components[0].equals(XDM_PAYLOAD_ROOT)) {
result = components[1];
}
}
return result;
}
/**
* Gets the XDM contents as OHT submit transaction data.
*
* @return the XDM contents as OHT submit transaction data
*/
public List getXdmContentsAsIpfSubmitTransactionData() {
lazyLoadCheck();
return txnData;
}
/**
* Gets the XDM contents as OHT XDSResponseType. This Object contains a flat
* list of all documents from all submission sets. It does not contain the full
* XDS Metadata for each document. If you want to get this data, please use the
* getDocumentAndMetadata method.
*
* @return The OHT XDSResponseType
*/
public XdmRetrieveResponseTypeImpl getXdmContentsAsOhtXdsResponseType() {
lazyLoadCheck();
for (var i = 0; i < txnData.size(); i++) {
resp.setAttachments(txnData.get(i).getDocuments());
}
return resp;
}
/**
* Tries accessing an XDM file inside ZIP using both MS-DOS and UNIX separators.
*
* @param zipFile the zip file
* @param subsetDirspec the subset dirspec
* @param subsetFilespec the subset filespec
* @param isRootFile the is root file
* @return the XDM zip entry
*/
private ZipEntry getXDMZipEntry(ZipFile zipFile, String subsetDirspec, String subsetFilespec, boolean isRootFile) {
ZipEntry result = null;
String zipFilespec;
if (!isRootFile) {
zipFilespec = XDM_PAYLOAD_ROOT + "\\" + subsetDirspec + "\\" + subsetFilespec.replace('/', '\\');
} else {
zipFilespec = subsetDirspec + subsetFilespec.replace('/', '\\');
}
result = zipFile.getEntry(zipFilespec);
if (result == null) {
zipFilespec = zipFilespec.replace('\\', '/');
result = zipFile.getEntry(zipFilespec);
}
return result;
}
/**
* Checks if Submit Transaction Data contains a valid dataset
*
* @param submissionSetNumber number of the dataset that should be checked
* @return true, if SubmitTransactionData has no valid data. false otherwise.
*/
private boolean isSubmitTransactionDataNull(int submissionSetNumber) {
if ((submissionSetNumber > txnData.size()) || (submissionSetNumber < 0)) {
return true;
} else {
if (txnData.isEmpty()) {
return true;
} else {
if (txnData.get(submissionSetNumber) == null) {
return true;
}
}
}
return false;
}
/**
* Checks, if the zipFile was already loaded
*/
private void lazyLoadCheck() {
if (txnData != null && zipFile != null && txnData.isEmpty()) {
loadXdmArchive();
}
}
/**
* Reads an XDM ZIP archive, so that the contents will be accessible with the
* get members. You have to use this method before you can access the contents.
*/
private void loadXdmArchive() {
this.resp.setStatus(Status.SUCCESS);
final Map results = new HashMap<>();
try {
List subsetDirspecs = unzip();
if (!subsetDirspecs.isEmpty()) {
// extract metadata
for (String subsetDirspec : subsetDirspecs) {
// we've found a new submission set
if (!results.containsKey(subsetDirspec)) {
// extract METADATA.XML
var metadata = extractMetadata(subsetDirspec);
if (metadata != null) {
results.put(subsetDirspec, metadata);
}
}
}
// load the descriptive files
loadDescriptiveFilesFromZipFile();
}
} catch (final IOException e) {
log.error("IO Error during loading of ZIP File. ", e);
this.resp.setStatus(Status.FAILURE);
return;
} catch (final Exception e) {
log.error("Exception during loading of ZIP File. ", e);
this.resp.setStatus(Status.FAILURE);
return;
}
this.txnData = results.values().stream().toList();
documentsIntegrityCheck();
}
/**
* unzip {@link ZipFile} and check size before.
*
* @return list of pathes of subdirectories
* @throws IOException
*/
private List unzip() throws IOException {
List results = new LinkedList<>();
final Enumeration zipEntries = zipFile.entries();
ZipEntry zipEntry = null;
int thresholdEntries = 10000;
int thresholdSize = 1000000000; // 1 GB
double thresholdRatio = 10;
int totalSizeArchive = 0;
int totalEntryArchive = 0;
// load the ZIP archive into memory
while (zipEntries.hasMoreElements()) {
zipEntry = zipEntries.nextElement();
totalEntryArchive++;
int nBytes = -1;
byte[] buffer = new byte[2048];
double totalSizeEntry = 0;
try (InputStream in = new BufferedInputStream(zipFile.getInputStream(zipEntry))) {
while ((nBytes = in.read(buffer)) > 0) {
totalSizeEntry += nBytes;
totalSizeArchive += nBytes;
double compressionRatio = totalSizeEntry / zipEntry.getCompressedSize();
if (compressionRatio > thresholdRatio) {
// ratio between compressed and uncompressed data is highly suspicious, looks
// like a Zip Bomb Attack
return new LinkedList<>();
}
}
if (totalSizeArchive > thresholdSize) {
// the uncompressed data size is too much for the application resource capacity
return new LinkedList<>();
}
if (totalEntryArchive > thresholdEntries) {
// too much entries in this archive, can lead to inodes exhaustion of the system
return new LinkedList<>();
}
if (!zipEntry.isDirectory() && zipEntry.getName().startsWith(XDM_PAYLOAD_ROOT)) {
results.add(getSubmissionSetDirspec(zipEntry.getName()));
}
}
}
return results;
}
/**
* extracts metadata XML from ZIP entry
*
* @param subsetDirspec path to zip entry
*
* @return extracted metadata as ProvideAndRegisterDocumentSet
* @throws IOException
* @throws JAXBException
*/
private ProvideAndRegisterDocumentSet extractMetadata(String subsetDirspec) throws IOException, JAXBException {
final var metadataEntry = getXDMZipEntry(zipFile, subsetDirspec, XDM_METADATA, false);
if (metadataEntry == null) {
log.warn("XDM submission set folder '{}' has no metadata file: {}", subsetDirspec, XDM_METADATA);
} else {
SubmitObjectsRequest request = null;
try (var in = zipFile.getInputStream(metadataEntry)) {
final var unmarshaller = JAXBContext.newInstance(SubmitObjectsRequest.class).createUnmarshaller();
request = (SubmitObjectsRequest) unmarshaller.unmarshal(in);
}
if (request != null) {
return getProvideAndRegisterDocumentSet(request, subsetDirspec);
}
}
return null;
}
private void loadDescriptiveFilesFromZipFile() {
try (InputStream isIndexHtm = zipFile.getInputStream(getXDMZipEntry(zipFile, "", XDM_INDEX, true))) {
this.indexHtm = new IndexHtm(isIndexHtm);
} catch (final IOException e) {
this.resp.setStatus(Status.FAILURE);
log.error("IO Exception during loading INDEX.HTM. ", e);
}
try (InputStream isReadme = zipFile.getInputStream(getXDMZipEntry(zipFile, "", XDM_README, true))) {
this.readmeTxt = new ReadmeTxt(isReadme);
} catch (final IOException e) {
this.resp.setStatus(Status.FAILURE);
log.error("IO Exception during loading README.TXT. ", e);
}
}
private ProvideAndRegisterDocumentSet getProvideAndRegisterDocumentSet(SubmitObjectsRequest request,
String subsetDirspec) throws IOException {
ProvideAndRegisterDocumentSet docSet = importXDMMetadata(request);
for (Document xdsDocument : docSet.getDocuments()) {
var xdsDocumentEntry = xdsDocument.getDocumentEntry();
final String subsetFilespec = xdsDocumentEntry.getUri();
// xdsDocumentEntry.setUri(null); // is not
// a valid 'URI' value for a repository
// submission
final var docZipEntry = getXDMZipEntry(zipFile, subsetDirspec, subsetFilespec, false);
if (docZipEntry != null) {
try (var docStream = zipFile.getInputStream(docZipEntry)) {
var dataSource = new ByteArrayDataSource(docStream, xdsDocumentEntry.getMimeType());
xdsDocument.setDataHandler(new DataHandler(dataSource));
}
} else {
log.error("{} in XDM submission folder {} has XDSDocumentEntry.URI '{}' that cannot be found in ZIP",
XDM_METADATA, subsetDirspec, xdsDocumentEntry.getUri());
}
}
return docSet;
}
public ProvideAndRegisterDocumentSet importXDMMetadata(SubmitObjectsRequest txnData) {
var provideAndRegisterDocumentSet = new ProvideAndRegisterDocumentSet();
var submit = EbXML30Converters.convert(txnData);
for (DocumentEntry documentEntry : submit.getDocumentEntries()) {
if (documentEntry != null) {
provideAndRegisterDocumentSet.getDocuments().add(new Document(documentEntry, null));
}
}
for (Association association : submit.getAssociations()) {
if (association != null) {
provideAndRegisterDocumentSet.getAssociations().add(association);
}
}
for (Folder folder : submit.getFolders()) {
if (folder != null) {
provideAndRegisterDocumentSet.getFolders().add(folder);
}
}
provideAndRegisterDocumentSet.setSubmissionSet(submit.getSubmissionSet());
return provideAndRegisterDocumentSet;
}
}