All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.daisy.pipeline.tts.osx.OSXSpeechEngine Maven / Gradle / Ivy

There is a newer version: 3.1.5
Show newest version
package org.daisy.pipeline.tts.osx;

import java.io.BufferedInputStream;
import java.io.BufferedOutputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.InputStream;
import java.io.PrintWriter;
import java.io.StringWriter;
import java.util.ArrayList;
import java.util.Collection;
import java.util.List;
import java.util.Scanner;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import javax.sound.sampled.AudioFormat;
import javax.sound.sampled.AudioInputStream;
import javax.sound.sampled.AudioSystem;

import net.sf.saxon.s9api.XdmNode;

import org.daisy.pipeline.audio.AudioBuffer;
import org.daisy.pipeline.tts.AudioBufferAllocator;
import org.daisy.pipeline.tts.AudioBufferAllocator.MemoryException;
import org.daisy.pipeline.tts.MarklessTTSEngine;
import org.daisy.pipeline.tts.SoundUtil;
import org.daisy.pipeline.tts.TTSEngine;
import org.daisy.pipeline.tts.TTSRegistry.TTSResource;
import org.daisy.pipeline.tts.TTSService.Mark;
import org.daisy.pipeline.tts.TTSService.SynthesisException;
import org.daisy.pipeline.tts.Voice;

public class OSXSpeechEngine extends MarklessTTSEngine {

	private AudioFormat mAudioFormat;
	private String mSayPath;
	private int mPriority;
	private final static int MIN_CHUNK_SIZE = 2048;

	public OSXSpeechEngine(OSXSpeechService service, String osxPath, int priority) {
		super(service);
		mPriority = priority;
		mSayPath = osxPath;
	}

	@Override
	public Collection synthesize(String sentence, XdmNode xmlSentence,
	        Voice voice, TTSResource threadResources,
	        AudioBufferAllocator bufferAllocator, boolean retry) throws SynthesisException,
	        InterruptedException, MemoryException {

		Collection result = new ArrayList();
		Process p = null;
		File waveOut = null;
		try {

			waveOut = File.createTempFile("pipeline", ".wav");
			p = Runtime.getRuntime().exec(
			        new String[]{
			                mSayPath, "--data-format=LEI16@22050", "-o",
			                waveOut.getAbsolutePath(), "-v", voice.name
			        });

			// write the sentence
			BufferedOutputStream out = new BufferedOutputStream((p.getOutputStream()));
			out.write(sentence.getBytes("utf-8"));
			out.close();

			p.waitFor();

			// read the wave on the standard output

			BufferedInputStream in = new BufferedInputStream(new FileInputStream(waveOut));
			AudioInputStream fi = AudioSystem.getAudioInputStream(in);

			if (mAudioFormat == null)
				mAudioFormat = fi.getFormat();

			while (true) {
				AudioBuffer b = bufferAllocator
				        .allocateBuffer(MIN_CHUNK_SIZE + fi.available());
				int ret = fi.read(b.data, 0, b.size);
				if (ret == -1) {
					//note: perhaps it would be better to call allocateBuffer()
					//somewhere else in order to avoid this extra call:
					bufferAllocator.releaseBuffer(b);
					break;
				}
				b.size = ret;
				result.add(b);
			}

			fi.close();
		} catch (MemoryException e) {
			SoundUtil.cancelFootPrint(result, bufferAllocator);
			p.destroy();
			throw e;
		} catch (InterruptedException e) {
			SoundUtil.cancelFootPrint(result, bufferAllocator);
			if (p != null)
				p.destroy();
			throw e;
		} catch (Exception e) {
			SoundUtil.cancelFootPrint(result, bufferAllocator);
			StringWriter sw = new StringWriter();
			e.printStackTrace(new PrintWriter(sw));
			if (p != null)
				p.destroy();
			throw new SynthesisException(e);
		} finally {
			if (waveOut != null)
				waveOut.delete();
		}
		return result;
	}

	@Override
	public AudioFormat getAudioOutputFormat() {
		return mAudioFormat;
	}

	@Override
	public Collection getAvailableVoices() throws SynthesisException,
	        InterruptedException {

		Collection result = new ArrayList();
		InputStream is;
		Process proc = null;
		Scanner scanner = null;
		Matcher mr;
		try {
			proc = Runtime.getRuntime().exec(new String[]{
			        mSayPath, "-v", "?"
			});
			is = proc.getInputStream();
			mr = Pattern.compile("(.*?)\\s+\\w{2}_\\w{2}").matcher("");
			scanner = new Scanner(is);
			while (scanner.hasNextLine()) {
				mr.reset(scanner.nextLine());
				if (mr.find()) {
					result.add(new Voice(getProvider().getName(), mr.group(1).trim()));
				}
			}
			is.close();
			proc.waitFor();
		} catch (Exception e) {
			if (proc != null) {
				proc.destroy();
			}
			throw new SynthesisException(e.getMessage(), e.getCause());
		} finally {
			if (scanner != null)
				scanner.close();
		}

		return result;
	}

	@Override
	public int getOverallPriority() {
		return mPriority;
	}

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy