All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.geneweaver.io.DirectSave Maven / Gradle / Ivy

/*-
 * 
 * Copyright 2018, 2020  The Jackson Laboratory Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 * 
 * @author Matthew Gerring
 */
package org.geneweaver.io;


import static org.geneweaver.io.connector.ChromosomeService.na;

import java.io.BufferedWriter;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.OutputStreamWriter;
import java.io.PrintStream;
import java.nio.file.Files;
import java.nio.file.Path;
import java.util.Collections;
import java.util.HashMap;
import java.util.Map;
import java.util.zip.GZIPOutputStream;

import org.geneweaver.domain.Entity;

/**
 * A simple function for importing static to find readers in a map 
 * and save to them.
 * 
 * @author gerrim
 *
 */
public class DirectSave implements AutoCloseable {
	
	private PrintStream log;
	private boolean verbose;
	
	public DirectSave() {
		this(null, false);
	}
	
	public DirectSave(PrintStream log, boolean verbose) {
		this.log = log;
		this.verbose = verbose;
	}

	/**
	 * This function uses the map to passed in to cache writers.
	 * @param e
	 * @param writers
	 * @param dir
	 * @param timer
	 * @return
	 */
	public Entity save(Entity e, Map, Map> paths, Map, Map> writers, Path dir, Timer timer) {
		return save(e, paths, writers, dir, timer, false);
	}
	
	/**
	 * This function uses the map passed in to cache writers.
	 * It is synchronized to avoid writing to the same file at the same
	 * time if multiple threads are used. 
	 * 
	 * @param e
	 * @param writers
	 * @param dir
	 * @param timer - may be null
	 * @return
	 */
	public Entity save(Entity e, Map, Map> paths, Map, Map> writers, Path dir, Timer timer, boolean append) {
		
		synchronized(e.getClass()) {
			try {
				if (!writers.containsKey(e.getClass())) {
					
					Path hpath = dir.resolve(e.getClass().getSimpleName()+"-header.csv");
					if (verbose) {
						if (log!=null) log.println("Creating header writer for "+hpath);
					}
					BufferedWriter header = Files.newBufferedWriter(hpath);
					header.write(e.getHeader());
					header.newLine();
					header.close();
					
					writers.put(e.getClass(), Collections.synchronizedMap(new HashMap<>()));
				}
				
				Map brs = writers.get(e.getClass());
				Map prs = paths.get(e.getClass());
				if (prs == null) {
					prs = Collections.synchronizedMap(new HashMap<>());
					paths.put(e.getClass(), prs);
				}

				String chr = e.getChr();
				if (chr==null) chr = na;
				if (!brs.containsKey(chr)) {
					Path pbody;
					if (chr.equals(Entity.NO_CHR)) {
						pbody = dir.resolve(e.getClass().getSimpleName()+".csv.gz");
					} else {
						pbody = dir.resolve(e.getClass().getSimpleName()+"-chr"+chr+".csv.gz");
					}
					if (verbose) {
						if (log!=null) log.println("Creating body writer for "+pbody);
					}
					BufferedWriter body = createWriter(pbody, append);
					brs.put(chr, body);
					prs.put(chr, pbody);
				}
				
				BufferedWriter writer = writers.get(e.getClass()).get(chr);
				writer.write(e.toCsv());
				writer.newLine();
				if (timer!=null) {
					Path path = paths.get(e.getClass()).get(chr);
					timer.time(path.toString(), verbose);
				}
			} catch (IOException ne) {
				throw new RuntimeException(ne);
			}
		}

		return e;
	}
	
	/**
	 * Create a GZip writer for use with writing bulk import files for neo4j,
	 * or in fact any gzip file.
	 * 
	 * @param pbody
	 * @param append
	 * @return
	 * @throws FileNotFoundException
	 * @throws IOException
	 */
	public static BufferedWriter createWriter(File pbody, boolean append) throws FileNotFoundException, IOException {
		return createWriter(pbody.toPath(), append);
	}

	/**
	 * Create a GZip writer for use with writing bulk import files for neo4j,
	 * or in fact any gzip file.
	 * 
	 * @param pbody
	 * @param append
	 * @return
	 * @throws FileNotFoundException
	 * @throws IOException
	 */
	public static BufferedWriter createWriter(Path pbody, boolean append) throws FileNotFoundException, IOException {
		BufferedWriter body = new BufferedWriter(new OutputStreamWriter(new GZIPOutputStream(new FileOutputStream(pbody.toFile(), append))));
		return body;
	}

	@Override
	public void close() throws Exception {
		// Nothing so far
	}

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy