// All downloads are free. Search and download functionality uses the official Maven repository.
//
// com.ibm.watson.speech_to_text.v1.model.CreateJobOptions Maven / Gradle / Ivy

/*
 * (C) Copyright IBM Corp. 2018, 2020.
 *
 * Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
 * an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations under the License.
 */
package com.ibm.watson.speech_to_text.v1.model;

import com.ibm.cloud.sdk.core.service.model.GenericModel;
import java.io.File;
import java.io.FileInputStream;
import java.io.FileNotFoundException;
import java.io.InputStream;
import java.util.ArrayList;
import java.util.List;

/** The createJob options. */
public class CreateJobOptions extends GenericModel {

  /**
   * String constants for the identifier of the model that is to be used for the recognition
   * request. See [Languages and
   * models](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-models#models).
   */
  public interface Model {

    // ar-AR
    /** Identifier {@code ar-AR_BroadbandModel}. */
    String AR_AR_BROADBANDMODEL = "ar-AR_BroadbandModel";

    // de-DE
    /** Identifier {@code de-DE_BroadbandModel}. */
    String DE_DE_BROADBANDMODEL = "de-DE_BroadbandModel";
    /** Identifier {@code de-DE_NarrowbandModel}. */
    String DE_DE_NARROWBANDMODEL = "de-DE_NarrowbandModel";

    // en-AU
    /** Identifier {@code en-AU_BroadbandModel}. */
    String EN_AU_BROADBANDMODEL = "en-AU_BroadbandModel";
    /** Identifier {@code en-AU_NarrowbandModel}. */
    String EN_AU_NARROWBANDMODEL = "en-AU_NarrowbandModel";

    // en-GB
    /** Identifier {@code en-GB_BroadbandModel}. */
    String EN_GB_BROADBANDMODEL = "en-GB_BroadbandModel";
    /** Identifier {@code en-GB_NarrowbandModel}. */
    String EN_GB_NARROWBANDMODEL = "en-GB_NarrowbandModel";

    // en-US
    /** Identifier {@code en-US_BroadbandModel}. */
    String EN_US_BROADBANDMODEL = "en-US_BroadbandModel";
    /** Identifier {@code en-US_NarrowbandModel}. */
    String EN_US_NARROWBANDMODEL = "en-US_NarrowbandModel";
    /** Identifier {@code en-US_ShortForm_NarrowbandModel}. */
    String EN_US_SHORTFORM_NARROWBANDMODEL = "en-US_ShortForm_NarrowbandModel";

    // es-AR
    /** Identifier {@code es-AR_BroadbandModel}. */
    String ES_AR_BROADBANDMODEL = "es-AR_BroadbandModel";
    /** Identifier {@code es-AR_NarrowbandModel}. */
    String ES_AR_NARROWBANDMODEL = "es-AR_NarrowbandModel";

    // es-CL
    /** Identifier {@code es-CL_BroadbandModel}. */
    String ES_CL_BROADBANDMODEL = "es-CL_BroadbandModel";
    /** Identifier {@code es-CL_NarrowbandModel}. */
    String ES_CL_NARROWBANDMODEL = "es-CL_NarrowbandModel";

    // es-CO
    /** Identifier {@code es-CO_BroadbandModel}. */
    String ES_CO_BROADBANDMODEL = "es-CO_BroadbandModel";
    /** Identifier {@code es-CO_NarrowbandModel}. */
    String ES_CO_NARROWBANDMODEL = "es-CO_NarrowbandModel";

    // es-ES
    /** Identifier {@code es-ES_BroadbandModel}. */
    String ES_ES_BROADBANDMODEL = "es-ES_BroadbandModel";
    /** Identifier {@code es-ES_NarrowbandModel}. */
    String ES_ES_NARROWBANDMODEL = "es-ES_NarrowbandModel";

    // es-MX
    /** Identifier {@code es-MX_BroadbandModel}. */
    String ES_MX_BROADBANDMODEL = "es-MX_BroadbandModel";
    /** Identifier {@code es-MX_NarrowbandModel}. */
    String ES_MX_NARROWBANDMODEL = "es-MX_NarrowbandModel";

    // es-PE
    /** Identifier {@code es-PE_BroadbandModel}. */
    String ES_PE_BROADBANDMODEL = "es-PE_BroadbandModel";
    /** Identifier {@code es-PE_NarrowbandModel}. */
    String ES_PE_NARROWBANDMODEL = "es-PE_NarrowbandModel";

    // fr-CA
    /** Identifier {@code fr-CA_BroadbandModel}. */
    String FR_CA_BROADBANDMODEL = "fr-CA_BroadbandModel";
    /** Identifier {@code fr-CA_NarrowbandModel}. */
    String FR_CA_NARROWBANDMODEL = "fr-CA_NarrowbandModel";

    // fr-FR
    /** Identifier {@code fr-FR_BroadbandModel}. */
    String FR_FR_BROADBANDMODEL = "fr-FR_BroadbandModel";
    /** Identifier {@code fr-FR_NarrowbandModel}. */
    String FR_FR_NARROWBANDMODEL = "fr-FR_NarrowbandModel";

    // it-IT
    /** Identifier {@code it-IT_BroadbandModel}. */
    String IT_IT_BROADBANDMODEL = "it-IT_BroadbandModel";
    /** Identifier {@code it-IT_NarrowbandModel}. */
    String IT_IT_NARROWBANDMODEL = "it-IT_NarrowbandModel";

    // ja-JP
    /** Identifier {@code ja-JP_BroadbandModel}. */
    String JA_JP_BROADBANDMODEL = "ja-JP_BroadbandModel";
    /** Identifier {@code ja-JP_NarrowbandModel}. */
    String JA_JP_NARROWBANDMODEL = "ja-JP_NarrowbandModel";

    // ko-KR
    /** Identifier {@code ko-KR_BroadbandModel}. */
    String KO_KR_BROADBANDMODEL = "ko-KR_BroadbandModel";
    /** Identifier {@code ko-KR_NarrowbandModel}. */
    String KO_KR_NARROWBANDMODEL = "ko-KR_NarrowbandModel";

    // nl-NL
    /** Identifier {@code nl-NL_BroadbandModel}. */
    String NL_NL_BROADBANDMODEL = "nl-NL_BroadbandModel";
    /** Identifier {@code nl-NL_NarrowbandModel}. */
    String NL_NL_NARROWBANDMODEL = "nl-NL_NarrowbandModel";

    // pt-BR
    /** Identifier {@code pt-BR_BroadbandModel}. */
    String PT_BR_BROADBANDMODEL = "pt-BR_BroadbandModel";
    /** Identifier {@code pt-BR_NarrowbandModel}. */
    String PT_BR_NARROWBANDMODEL = "pt-BR_NarrowbandModel";

    // zh-CN
    /** Identifier {@code zh-CN_BroadbandModel}. */
    String ZH_CN_BROADBANDMODEL = "zh-CN_BroadbandModel";
    /** Identifier {@code zh-CN_NarrowbandModel}. */
    String ZH_CN_NARROWBANDMODEL = "zh-CN_NarrowbandModel";
  }

  /**
   * If the job includes a callback URL, a comma-separated list of notification events to which to
   * subscribe. Valid events are * `recognitions.started` generates a callback notification when the
   * service begins to process the job. * `recognitions.completed` generates a callback notification
   * when the job is complete. You must use the **Check a job** method to retrieve the results
   * before they time out or are deleted. * `recognitions.completed_with_results` generates a
   * callback notification when the job is complete. The notification includes the results of the
   * request. * `recognitions.failed` generates a callback notification if the service experiences
   * an error while processing the job.
   *
   * 

The `recognitions.completed` and `recognitions.completed_with_results` events are * incompatible. You can specify only of the two events. * *

If the job includes a callback URL, omit the parameter to subscribe to the default events: * `recognitions.started`, `recognitions.completed`, and `recognitions.failed`. If the job does * not include a callback URL, omit the parameter. */ public interface Events { /** recognitions.started. */ String RECOGNITIONS_STARTED = "recognitions.started"; /** recognitions.completed. */ String RECOGNITIONS_COMPLETED = "recognitions.completed"; /** recognitions.completed_with_results. */ String RECOGNITIONS_COMPLETED_WITH_RESULTS = "recognitions.completed_with_results"; /** recognitions.failed. */ String RECOGNITIONS_FAILED = "recognitions.failed"; } protected InputStream audio; protected String contentType; protected String model; protected String callbackUrl; protected String events; protected String userToken; protected Long resultsTtl; protected String languageCustomizationId; protected String acousticCustomizationId; protected String baseModelVersion; protected Double customizationWeight; protected Long inactivityTimeout; protected List keywords; protected Float keywordsThreshold; protected Long maxAlternatives; protected Float wordAlternativesThreshold; protected Boolean wordConfidence; protected Boolean timestamps; protected Boolean profanityFilter; protected Boolean smartFormatting; protected Boolean speakerLabels; protected String customizationId; protected String grammarName; protected Boolean redaction; protected Boolean processingMetrics; protected Float processingMetricsInterval; protected Boolean audioMetrics; protected Double endOfPhraseSilenceTime; protected Boolean splitTranscriptAtPhraseEnd; protected Float speechDetectorSensitivity; protected Float backgroundAudioSuppression; /** Builder. 
*/ public static class Builder { private InputStream audio; private String contentType; private String model; private String callbackUrl; private String events; private String userToken; private Long resultsTtl; private String languageCustomizationId; private String acousticCustomizationId; private String baseModelVersion; private Double customizationWeight; private Long inactivityTimeout; private List keywords; private Float keywordsThreshold; private Long maxAlternatives; private Float wordAlternativesThreshold; private Boolean wordConfidence; private Boolean timestamps; private Boolean profanityFilter; private Boolean smartFormatting; private Boolean speakerLabels; private String customizationId; private String grammarName; private Boolean redaction; private Boolean processingMetrics; private Float processingMetricsInterval; private Boolean audioMetrics; private Double endOfPhraseSilenceTime; private Boolean splitTranscriptAtPhraseEnd; private Float speechDetectorSensitivity; private Float backgroundAudioSuppression; private Builder(CreateJobOptions createJobOptions) { this.audio = createJobOptions.audio; this.contentType = createJobOptions.contentType; this.model = createJobOptions.model; this.callbackUrl = createJobOptions.callbackUrl; this.events = createJobOptions.events; this.userToken = createJobOptions.userToken; this.resultsTtl = createJobOptions.resultsTtl; this.languageCustomizationId = createJobOptions.languageCustomizationId; this.acousticCustomizationId = createJobOptions.acousticCustomizationId; this.baseModelVersion = createJobOptions.baseModelVersion; this.customizationWeight = createJobOptions.customizationWeight; this.inactivityTimeout = createJobOptions.inactivityTimeout; this.keywords = createJobOptions.keywords; this.keywordsThreshold = createJobOptions.keywordsThreshold; this.maxAlternatives = createJobOptions.maxAlternatives; this.wordAlternativesThreshold = createJobOptions.wordAlternativesThreshold; this.wordConfidence = 
createJobOptions.wordConfidence; this.timestamps = createJobOptions.timestamps; this.profanityFilter = createJobOptions.profanityFilter; this.smartFormatting = createJobOptions.smartFormatting; this.speakerLabels = createJobOptions.speakerLabels; this.customizationId = createJobOptions.customizationId; this.grammarName = createJobOptions.grammarName; this.redaction = createJobOptions.redaction; this.processingMetrics = createJobOptions.processingMetrics; this.processingMetricsInterval = createJobOptions.processingMetricsInterval; this.audioMetrics = createJobOptions.audioMetrics; this.endOfPhraseSilenceTime = createJobOptions.endOfPhraseSilenceTime; this.splitTranscriptAtPhraseEnd = createJobOptions.splitTranscriptAtPhraseEnd; this.speechDetectorSensitivity = createJobOptions.speechDetectorSensitivity; this.backgroundAudioSuppression = createJobOptions.backgroundAudioSuppression; } /** Instantiates a new builder. */ public Builder() {} /** * Instantiates a new builder with required properties. * * @param audio the audio */ public Builder(InputStream audio) { this.audio = audio; } /** * Builds a CreateJobOptions. * * @return the new CreateJobOptions instance */ public CreateJobOptions build() { return new CreateJobOptions(this); } /** * Adds an keyword to keywords. * * @param keyword the new keyword * @return the CreateJobOptions builder */ public Builder addKeyword(String keyword) { com.ibm.cloud.sdk.core.util.Validator.notNull(keyword, "keyword cannot be null"); if (this.keywords == null) { this.keywords = new ArrayList(); } this.keywords.add(keyword); return this; } /** * Set the audio. * * @param audio the audio * @return the CreateJobOptions builder */ public Builder audio(InputStream audio) { this.audio = audio; return this; } /** * Set the contentType. * * @param contentType the contentType * @return the CreateJobOptions builder */ public Builder contentType(String contentType) { this.contentType = contentType; return this; } /** * Set the model. 
* * @param model the model * @return the CreateJobOptions builder */ public Builder model(String model) { this.model = model; return this; } /** * Set the callbackUrl. * * @param callbackUrl the callbackUrl * @return the CreateJobOptions builder */ public Builder callbackUrl(String callbackUrl) { this.callbackUrl = callbackUrl; return this; } /** * Set the events. * * @param events the events * @return the CreateJobOptions builder */ public Builder events(String events) { this.events = events; return this; } /** * Set the userToken. * * @param userToken the userToken * @return the CreateJobOptions builder */ public Builder userToken(String userToken) { this.userToken = userToken; return this; } /** * Set the resultsTtl. * * @param resultsTtl the resultsTtl * @return the CreateJobOptions builder */ public Builder resultsTtl(long resultsTtl) { this.resultsTtl = resultsTtl; return this; } /** * Set the languageCustomizationId. * * @param languageCustomizationId the languageCustomizationId * @return the CreateJobOptions builder */ public Builder languageCustomizationId(String languageCustomizationId) { this.languageCustomizationId = languageCustomizationId; return this; } /** * Set the acousticCustomizationId. * * @param acousticCustomizationId the acousticCustomizationId * @return the CreateJobOptions builder */ public Builder acousticCustomizationId(String acousticCustomizationId) { this.acousticCustomizationId = acousticCustomizationId; return this; } /** * Set the baseModelVersion. * * @param baseModelVersion the baseModelVersion * @return the CreateJobOptions builder */ public Builder baseModelVersion(String baseModelVersion) { this.baseModelVersion = baseModelVersion; return this; } /** * Set the customizationWeight. 
* * @param customizationWeight the customizationWeight * @return the CreateJobOptions builder */ public Builder customizationWeight(Double customizationWeight) { this.customizationWeight = customizationWeight; return this; } /** * Set the inactivityTimeout. * * @param inactivityTimeout the inactivityTimeout * @return the CreateJobOptions builder */ public Builder inactivityTimeout(long inactivityTimeout) { this.inactivityTimeout = inactivityTimeout; return this; } /** * Set the keywords. Existing keywords will be replaced. * * @param keywords the keywords * @return the CreateJobOptions builder */ public Builder keywords(List keywords) { this.keywords = keywords; return this; } /** * Set the keywordsThreshold. * * @param keywordsThreshold the keywordsThreshold * @return the CreateJobOptions builder */ public Builder keywordsThreshold(Float keywordsThreshold) { this.keywordsThreshold = keywordsThreshold; return this; } /** * Set the maxAlternatives. * * @param maxAlternatives the maxAlternatives * @return the CreateJobOptions builder */ public Builder maxAlternatives(long maxAlternatives) { this.maxAlternatives = maxAlternatives; return this; } /** * Set the wordAlternativesThreshold. * * @param wordAlternativesThreshold the wordAlternativesThreshold * @return the CreateJobOptions builder */ public Builder wordAlternativesThreshold(Float wordAlternativesThreshold) { this.wordAlternativesThreshold = wordAlternativesThreshold; return this; } /** * Set the wordConfidence. * * @param wordConfidence the wordConfidence * @return the CreateJobOptions builder */ public Builder wordConfidence(Boolean wordConfidence) { this.wordConfidence = wordConfidence; return this; } /** * Set the timestamps. * * @param timestamps the timestamps * @return the CreateJobOptions builder */ public Builder timestamps(Boolean timestamps) { this.timestamps = timestamps; return this; } /** * Set the profanityFilter. 
* * @param profanityFilter the profanityFilter * @return the CreateJobOptions builder */ public Builder profanityFilter(Boolean profanityFilter) { this.profanityFilter = profanityFilter; return this; } /** * Set the smartFormatting. * * @param smartFormatting the smartFormatting * @return the CreateJobOptions builder */ public Builder smartFormatting(Boolean smartFormatting) { this.smartFormatting = smartFormatting; return this; } /** * Set the speakerLabels. * * @param speakerLabels the speakerLabels * @return the CreateJobOptions builder */ public Builder speakerLabels(Boolean speakerLabels) { this.speakerLabels = speakerLabels; return this; } /** * Set the customizationId. * * @param customizationId the customizationId * @return the CreateJobOptions builder */ public Builder customizationId(String customizationId) { this.customizationId = customizationId; return this; } /** * Set the grammarName. * * @param grammarName the grammarName * @return the CreateJobOptions builder */ public Builder grammarName(String grammarName) { this.grammarName = grammarName; return this; } /** * Set the redaction. * * @param redaction the redaction * @return the CreateJobOptions builder */ public Builder redaction(Boolean redaction) { this.redaction = redaction; return this; } /** * Set the processingMetrics. * * @param processingMetrics the processingMetrics * @return the CreateJobOptions builder */ public Builder processingMetrics(Boolean processingMetrics) { this.processingMetrics = processingMetrics; return this; } /** * Set the processingMetricsInterval. * * @param processingMetricsInterval the processingMetricsInterval * @return the CreateJobOptions builder */ public Builder processingMetricsInterval(Float processingMetricsInterval) { this.processingMetricsInterval = processingMetricsInterval; return this; } /** * Set the audioMetrics. 
* * @param audioMetrics the audioMetrics * @return the CreateJobOptions builder */ public Builder audioMetrics(Boolean audioMetrics) { this.audioMetrics = audioMetrics; return this; } /** * Set the endOfPhraseSilenceTime. * * @param endOfPhraseSilenceTime the endOfPhraseSilenceTime * @return the CreateJobOptions builder */ public Builder endOfPhraseSilenceTime(Double endOfPhraseSilenceTime) { this.endOfPhraseSilenceTime = endOfPhraseSilenceTime; return this; } /** * Set the splitTranscriptAtPhraseEnd. * * @param splitTranscriptAtPhraseEnd the splitTranscriptAtPhraseEnd * @return the CreateJobOptions builder */ public Builder splitTranscriptAtPhraseEnd(Boolean splitTranscriptAtPhraseEnd) { this.splitTranscriptAtPhraseEnd = splitTranscriptAtPhraseEnd; return this; } /** * Set the speechDetectorSensitivity. * * @param speechDetectorSensitivity the speechDetectorSensitivity * @return the CreateJobOptions builder */ public Builder speechDetectorSensitivity(Float speechDetectorSensitivity) { this.speechDetectorSensitivity = speechDetectorSensitivity; return this; } /** * Set the backgroundAudioSuppression. * * @param backgroundAudioSuppression the backgroundAudioSuppression * @return the CreateJobOptions builder */ public Builder backgroundAudioSuppression(Float backgroundAudioSuppression) { this.backgroundAudioSuppression = backgroundAudioSuppression; return this; } /** * Set the audio. 
* * @param audio the audio * @return the CreateJobOptions builder * @throws FileNotFoundException if the file could not be found */ public Builder audio(File audio) throws FileNotFoundException { this.audio = new FileInputStream(audio); return this; } } protected CreateJobOptions(Builder builder) { com.ibm.cloud.sdk.core.util.Validator.notNull(builder.audio, "audio cannot be null"); audio = builder.audio; contentType = builder.contentType; model = builder.model; callbackUrl = builder.callbackUrl; events = builder.events; userToken = builder.userToken; resultsTtl = builder.resultsTtl; languageCustomizationId = builder.languageCustomizationId; acousticCustomizationId = builder.acousticCustomizationId; baseModelVersion = builder.baseModelVersion; customizationWeight = builder.customizationWeight; inactivityTimeout = builder.inactivityTimeout; keywords = builder.keywords; keywordsThreshold = builder.keywordsThreshold; maxAlternatives = builder.maxAlternatives; wordAlternativesThreshold = builder.wordAlternativesThreshold; wordConfidence = builder.wordConfidence; timestamps = builder.timestamps; profanityFilter = builder.profanityFilter; smartFormatting = builder.smartFormatting; speakerLabels = builder.speakerLabels; customizationId = builder.customizationId; grammarName = builder.grammarName; redaction = builder.redaction; processingMetrics = builder.processingMetrics; processingMetricsInterval = builder.processingMetricsInterval; audioMetrics = builder.audioMetrics; endOfPhraseSilenceTime = builder.endOfPhraseSilenceTime; splitTranscriptAtPhraseEnd = builder.splitTranscriptAtPhraseEnd; speechDetectorSensitivity = builder.speechDetectorSensitivity; backgroundAudioSuppression = builder.backgroundAudioSuppression; } /** * New builder. * * @return a CreateJobOptions builder */ public Builder newBuilder() { return new Builder(this); } /** * Gets the audio. * *

The audio to transcribe. * * @return the audio */ public InputStream audio() { return audio; } /** * Gets the contentType. * *

The format (MIME type) of the audio. For more information about specifying an audio format, * see **Audio formats (content types)** in the method description. * * @return the contentType */ public String contentType() { return contentType; } /** * Gets the model. * *

The identifier of the model that is to be used for the recognition request. See [Languages * and models](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-models#models). * * @return the model */ public String model() { return model; } /** * Gets the callbackUrl. * *

A URL to which callback notifications are to be sent. The URL must already be successfully * allowlisted by using the **Register a callback** method. You can include the same callback URL * with any number of job creation requests. Omit the parameter to poll the service for job * completion and results. * *

Use the `user_token` parameter to specify a unique user-specified string with each job to * differentiate the callback notifications for the jobs. * * @return the callbackUrl */ public String callbackUrl() { return callbackUrl; } /** * Gets the events. * *

If the job includes a callback URL, a comma-separated list of notification events to which * to subscribe. Valid events are * `recognitions.started` generates a callback notification when * the service begins to process the job. * `recognitions.completed` generates a callback * notification when the job is complete. You must use the **Check a job** method to retrieve the * results before they time out or are deleted. * `recognitions.completed_with_results` generates * a callback notification when the job is complete. The notification includes the results of the * request. * `recognitions.failed` generates a callback notification if the service experiences * an error while processing the job. * *

The `recognitions.completed` and `recognitions.completed_with_results` events are * incompatible. You can specify only of the two events. * *

If the job includes a callback URL, omit the parameter to subscribe to the default events: * `recognitions.started`, `recognitions.completed`, and `recognitions.failed`. If the job does * not include a callback URL, omit the parameter. * * @return the events */ public String events() { return events; } /** * Gets the userToken. * *

If the job includes a callback URL, a user-specified string that the service is to include * with each callback notification for the job; the token allows the user to maintain an internal * mapping between jobs and notification events. If the job does not include a callback URL, omit * the parameter. * * @return the userToken */ public String userToken() { return userToken; } /** * Gets the resultsTtl. * *

The number of minutes for which the results are to be available after the job has finished. * If not delivered via a callback, the results must be retrieved within this time. Omit the * parameter to use a time to live of one week. The parameter is valid with or without a callback * URL. * * @return the resultsTtl */ public Long resultsTtl() { return resultsTtl; } /** * Gets the languageCustomizationId. * *

The customization ID (GUID) of a custom language model that is to be used with the * recognition request. The base model of the specified custom language model must match the model * specified with the `model` parameter. You must make the request with credentials for the * instance of the service that owns the custom model. By default, no custom language model is * used. See [Custom * models](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-input#custom-input). * *

**Note:** Use this parameter instead of the deprecated `customization_id` parameter. * * @return the languageCustomizationId */ public String languageCustomizationId() { return languageCustomizationId; } /** * Gets the acousticCustomizationId. * *

The customization ID (GUID) of a custom acoustic model that is to be used with the * recognition request. The base model of the specified custom acoustic model must match the model * specified with the `model` parameter. You must make the request with credentials for the * instance of the service that owns the custom model. By default, no custom acoustic model is * used. See [Custom * models](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-input#custom-input). * * @return the acousticCustomizationId */ public String acousticCustomizationId() { return acousticCustomizationId; } /** * Gets the baseModelVersion. * *

The version of the specified base model that is to be used with the recognition request. * Multiple versions of a base model can exist when a model is updated for internal improvements. * The parameter is intended primarily for use with custom models that have been upgraded for a * new base model. The default value depends on whether the parameter is used with or without a * custom model. See [Base model * version](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-input#version). * * @return the baseModelVersion */ public String baseModelVersion() { return baseModelVersion; } /** * Gets the customizationWeight. * *

If you specify the customization ID (GUID) of a custom language model with the recognition * request, the customization weight tells the service how much weight to give to words from the * custom language model compared to those from the base model for the current request. * *

Specify a value between 0.0 and 1.0. Unless a different customization weight was specified * for the custom model when it was trained, the default value is 0.3. A customization weight that * you specify overrides a weight that was specified when the custom model was trained. * *

The default value yields the best performance in general. Assign a higher value if your * audio makes frequent use of OOV words from the custom model. Use caution when setting the * weight: a higher value can improve the accuracy of phrases from the custom model's domain, but * it can negatively affect performance on non-domain phrases. * *

See [Custom * models](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-input#custom-input). * * @return the customizationWeight */ public Double customizationWeight() { return customizationWeight; } /** * Gets the inactivityTimeout. * *

The time in seconds after which, if only silence (no speech) is detected in streaming audio, * the connection is closed with a 400 error. The parameter is useful for stopping audio * submission from a live microphone when a user simply walks away. Use `-1` for infinity. See * [Inactivity * timeout](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-input#timeouts-inactivity). * * @return the inactivityTimeout */ public Long inactivityTimeout() { return inactivityTimeout; } /** * Gets the keywords. * *

An array of keyword strings to spot in the audio. Each keyword string can include one or * more string tokens. Keywords are spotted only in the final results, not in interim hypotheses. * If you specify any keywords, you must also specify a keywords threshold. Omit the parameter or * specify an empty array if you do not need to spot keywords. * *

You can spot a maximum of 1000 keywords with a single request. A single keyword can have a * maximum length of 1024 characters, though the maximum effective length for double-byte * languages might be shorter. Keywords are case-insensitive. * *

See [Keyword * spotting](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#keyword_spotting). * * @return the keywords */ public List keywords() { return keywords; } /** * Gets the keywordsThreshold. * *

A confidence value that is the lower bound for spotting a keyword. A word is considered to * match a keyword if its confidence is greater than or equal to the threshold. Specify a * probability between 0.0 and 1.0. If you specify a threshold, you must also specify one or more * keywords. The service performs no keyword spotting if you omit either parameter. See [Keyword * spotting](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#keyword_spotting). * * @return the keywordsThreshold */ public Float keywordsThreshold() { return keywordsThreshold; } /** * Gets the maxAlternatives. * *

The maximum number of alternative transcripts that the service is to return. By default, the * service returns a single transcript. If you specify a value of `0`, the service uses the * default value, `1`. See [Maximum * alternatives](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#max_alternatives). * * @return the maxAlternatives */ public Long maxAlternatives() { return maxAlternatives; } /** * Gets the wordAlternativesThreshold. * *

A confidence value that is the lower bound for identifying a hypothesis as a possible word * alternative (also known as "Confusion Networks"). An alternative word is considered if its * confidence is greater than or equal to the threshold. Specify a probability between 0.0 and * 1.0. By default, the service computes no alternative words. See [Word * alternatives](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#word_alternatives). * * @return the wordAlternativesThreshold */ public Float wordAlternativesThreshold() { return wordAlternativesThreshold; } /** * Gets the wordConfidence. * *

If `true`, the service returns a confidence measure in the range of 0.0 to 1.0 for each * word. By default, the service returns no word confidence scores. See [Word * confidence](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#word_confidence). * * @return the wordConfidence */ public Boolean wordConfidence() { return wordConfidence; } /** * Gets the timestamps. * *

If `true`, the service returns time alignment for each word. By default, no timestamps are * returned. See [Word * timestamps](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#word_timestamps). * * @return the timestamps */ public Boolean timestamps() { return timestamps; } /** * Gets the profanityFilter. * *

If `true`, the service filters profanity from all output except for keyword results by * replacing inappropriate words with a series of asterisks. Set the parameter to `false` to * return results with no censoring. Applies to US English transcription only. See [Profanity * filtering](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#profanity_filter). * * @return the profanityFilter */ public Boolean profanityFilter() { return profanityFilter; } /** * Gets the smartFormatting. * *

If `true`, the service converts dates, times, series of digits and numbers, phone numbers, * currency values, and internet addresses into more readable, conventional representations in the * final transcript of a recognition request. For US English, the service also converts certain * keyword strings to punctuation symbols. By default, the service performs no smart formatting. * *

**Note:** Applies to US English, Japanese, and Spanish transcription only. * *

See [Smart * formatting](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#smart_formatting). * * @return the smartFormatting */ public Boolean smartFormatting() { return smartFormatting; } /** * Gets the speakerLabels. * *

If `true`, the response includes labels that identify which words were spoken by which * participants in a multi-person exchange. By default, the service returns no speaker labels. * Setting `speaker_labels` to `true` forces the `timestamps` parameter to be `true`, regardless * of whether you specify `false` for the parameter. * *

**Note:** Applies to US English, Australian English, German, Japanese, Korean, and Spanish * (both broadband and narrowband models) and UK English (narrowband model) transcription only. * *

See [Speaker * labels](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#speaker_labels). * * @return the speakerLabels */ public Boolean speakerLabels() { return speakerLabels; } /** * Gets the customizationId. * *

* <p>**Deprecated.** Use the `language_customization_id` parameter to specify the customization
   * ID (GUID) of a custom language model that is to be used with the recognition request. Do not
   * specify both parameters with a request.
   *
   * @return the customizationId
   */
  public String customizationId() {
    return this.customizationId;
  }

  /**
   * Gets the grammarName.
   *

The name of a grammar that is to be used with the recognition request. If you specify a * grammar, you must also use the `language_customization_id` parameter to specify the name of the * custom language model for which the grammar is defined. The service recognizes only strings * that are recognized by the specified grammar; it does not recognize other custom words from the * model's words resource. See * [Grammars](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-input#grammars-input). * * @return the grammarName */ public String grammarName() { return grammarName; } /** * Gets the redaction. * *

If `true`, the service redacts, or masks, numeric data from final transcripts. The feature * redacts any number that has three or more consecutive digits by replacing each digit with an * `X` character. It is intended to redact sensitive numeric data, such as credit card numbers. By * default, the service performs no redaction. * *

When you enable redaction, the service automatically enables smart formatting, regardless of * whether you explicitly disable that feature. To ensure maximum security, the service also * disables keyword spotting (ignores the `keywords` and `keywords_threshold` parameters) and * returns only a single final transcript (forces the `max_alternatives` parameter to be `1`). * *

**Note:** Applies to US English, Japanese, and Korean transcription only. * *

See [Numeric * redaction](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#redaction). * * @return the redaction */ public Boolean redaction() { return redaction; } /** * Gets the processingMetrics. * *

If `true`, requests processing metrics about the service's transcription of the input audio. * The service returns processing metrics at the interval specified by the * `processing_metrics_interval` parameter. It also returns processing metrics for transcription * events, for example, for final and interim results. By default, the service returns no * processing metrics. * *

See [Processing * metrics](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-metrics#processing_metrics). * * @return the processingMetrics */ public Boolean processingMetrics() { return processingMetrics; } /** * Gets the processingMetricsInterval. * *

Specifies the interval in real wall-clock seconds at which the service is to return * processing metrics. The parameter is ignored unless the `processing_metrics` parameter is set * to `true`. * *

The parameter accepts a minimum value of 0.1 seconds. The level of precision is not * restricted, so you can specify values such as 0.25 and 0.125. * *

The service does not impose a maximum value. If you want to receive processing metrics only * for transcription events instead of at periodic intervals, set the value to a large number. If * the value is larger than the duration of the audio, the service returns processing metrics only * for transcription events. * *

See [Processing * metrics](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-metrics#processing_metrics). * * @return the processingMetricsInterval */ public Float processingMetricsInterval() { return processingMetricsInterval; } /** * Gets the audioMetrics. * *

If `true`, requests detailed information about the signal characteristics of the input * audio. The service returns audio metrics with the final transcription results. By default, the * service returns no audio metrics. * *

See [Audio * metrics](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-metrics#audio_metrics). * * @return the audioMetrics */ public Boolean audioMetrics() { return audioMetrics; } /** * Gets the endOfPhraseSilenceTime. * *

If `true`, specifies the duration of the pause interval at which the service splits a * transcript into multiple final results. If the service detects pauses or extended silence * before it reaches the end of the audio stream, its response can include multiple final results. * Silence indicates a point at which the speaker pauses between spoken words or phrases. * *

Specify a value for the pause interval in the range of 0.0 to 120.0. * A value greater than * 0 specifies the interval that the service is to use for speech recognition. * A value of 0 * indicates that the service is to use the default interval. It is equivalent to omitting the * parameter. * *

The default pause interval for most languages is 0.8 seconds; the default for Chinese is 0.6 * seconds. * *

See [End of phrase silence * time](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#silence_time). * * @return the endOfPhraseSilenceTime */ public Double endOfPhraseSilenceTime() { return endOfPhraseSilenceTime; } /** * Gets the splitTranscriptAtPhraseEnd. * *

If `true`, directs the service to split the transcript into multiple final results based on * semantic features of the input, for example, at the conclusion of meaningful phrases such as * sentences. The service bases its understanding of semantic features on the base language model * that you use with a request. Custom language models and grammars can also influence how and * where the service splits a transcript. By default, the service splits transcripts based solely * on the pause interval. * *

See [Split transcript at phrase * end](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-output#split_transcript). * * @return the splitTranscriptAtPhraseEnd */ public Boolean splitTranscriptAtPhraseEnd() { return splitTranscriptAtPhraseEnd; } /** * Gets the speechDetectorSensitivity. * *

The sensitivity of speech activity detection that the service is to perform. Use the * parameter to suppress word insertions from music, coughing, and other non-speech events. The * service biases the audio it passes for speech recognition by evaluating the input audio against * prior models of speech and non-speech activity. * *

Specify a value between 0.0 and 1.0: * 0.0 suppresses all audio (no speech is transcribed). * * 0.5 (the default) provides a reasonable compromise for the level of sensitivity. * 1.0 * suppresses no audio (speech detection sensitivity is disabled). * *

The values increase on a monotonic curve. See [Speech Activity * Detection](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-input#detection). * * @return the speechDetectorSensitivity */ public Float speechDetectorSensitivity() { return speechDetectorSensitivity; } /** * Gets the backgroundAudioSuppression. * *

The level to which the service is to suppress background audio based on its volume to * prevent it from being transcribed as speech. Use the parameter to suppress side conversations * or background noise. * *

Specify a value in the range of 0.0 to 1.0: * 0.0 (the default) provides no suppression * (background audio suppression is disabled). * 0.5 provides a reasonable level of audio * suppression for general usage. * 1.0 suppresses all audio (no audio is transcribed). * *

The values increase on a monotonic curve. See [Speech Activity * Detection](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-input#detection). * * @return the backgroundAudioSuppression */ public Float backgroundAudioSuppression() { return backgroundAudioSuppression; } }





© 2015 - 2024 Weber Informatics LLC | Privacy Policy