All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.restcomm.connect.asr.ISpeechAsr Maven / Gradle / Ivy

/*
 * TeleStax, Open Source Cloud Communications
 * Copyright 2011-2014, Telestax Inc and individual contributors
 * by the @authors tag.
 *
 * This program is free software: you can redistribute it and/or modify
 * under the terms of the GNU Affero General Public License as
 * published by the Free Software Foundation; either version 3 of
 * the License, or (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see 
 *
 */
package org.restcomm.connect.asr;

import akka.actor.ActorRef;
import akka.actor.UntypedActor;

import com.iSpeech.SpeechResult;
import com.iSpeech.iSpeechRecognizer;
import static com.iSpeech.iSpeechRecognizer.*;
import com.iSpeech.iSpeechRecognizer.SpeechRecognizerEvent;

import java.io.File;
import java.util.HashMap;
import java.util.Map;

import org.apache.commons.configuration.Configuration;

/**
 * @author [email protected] (Thomas Quintana)
 */
public final class ISpeechAsr extends UntypedActor implements SpeechRecognizerEvent {
    private static final Map languages = new HashMap();
    static {
        languages.put("en", "en-US");
        languages.put("en-gb", "en-GB");
        languages.put("es", "es-ES");
        languages.put("it", "it-IT");
        languages.put("fr", "fr-FR");
        languages.put("pl", "pl-PL");
        languages.put("pt", "pt-PT");
    }

    private final String key;
    private final boolean production;

    public ISpeechAsr(final Configuration configuration) {
        super();
        key = configuration.getString("api-key");
        production = configuration.getBoolean("api-key[@production]");
    }

    private AsrInfo info() {
        return new AsrInfo(languages.keySet());
    }

    @Override
    public void onReceive(final Object message) throws Exception {
        final Class klass = message.getClass();
        final ActorRef self = self();
        final ActorRef sender = sender();
        if (AsrRequest.class.equals(klass)) {
            final AsrRequest request = (AsrRequest) message;
            final Map attributes = request.attributes();
            try {
                if (attributes != null) {
                    sender.tell(new AsrResponse(recognize(message), attributes), self);
                } else {
                    sender.tell(new AsrResponse(recognize(message)), self);
                }
            } catch (final Exception exception) {
                if (attributes != null) {
                    sender.tell(new AsrResponse(exception, attributes), self);
                } else {
                    sender.tell(new AsrResponse(exception), self);
                }
            }
        } else if (GetAsrInfo.class.equals(klass)) {
            sender.tell(new AsrResponse(info()), self);
        }
    }

    private String recognize(final Object message) throws Exception {
        final AsrRequest request = (AsrRequest) message;
        final File file = request.file();
        final String language = languages.get(request.language());
        final iSpeechRecognizer recognizer = iSpeechRecognizer.getInstance(key, production);
        recognizer.setFreeForm(FREEFORM_DICTATION);
        recognizer.setLanguage(language);
        final SpeechResult results = recognizer.startFileRecognize("audio/x-wav", file, this);
        return results.Text;
    }

    @Override
    public void stateChanged(final int event, final int value, final Exception exception) {
        if (SpeechRecognizerEvent.RECORDING_ERROR == event) {
            // We don't use the recorder.
        }
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy