feat(SpeechToText): Add support for EndOfPhraseSilenceTime and SplitTranscriptAtPhraseEnd to STT web

mamoonraja · mamoonraja · commit a009df5b712f · 2020-01-16T16:10:59.000-05:00
diff --git a/Examples/ExampleStreaming.cs b/Examples/ExampleStreaming.cs
@@ -1,5 +1,5 @@
 ﻿/**
-* (C) Copyright IBM Corp. 2015, 2019.
+* (C) Copyright IBM Corp. 2015, 2020.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
@@ -109,6 +109,7 @@ public bool Active
                     _service.SmartFormatting = true;
                     _service.SpeakerLabels = false;
                     _service.WordAlternativesThreshold = null;
+                    _service.EndOfPhraseSilenceTime = null;
                     _service.StartListening(OnRecognize, OnRecognizeSpeaker);
                 }
                 else if (!value && _service.IsListening)
diff --git a/Scripts/Services/SpeechToText/V1/SpeechToTextServiceExtension.cs b/Scripts/Services/SpeechToText/V1/SpeechToTextServiceExtension.cs
@@ -257,6 +257,35 @@ public float SilenceThreshold
         /// (optional)
         /// </summary>
         public float? ProcessingMetricsInterval { get; set; }
+        /// <summary>
+        /// Specifies the duration (in seconds) of the pause interval at which the service splits a transcript into multiple final results.
+        /// If the service detects pauses or extended silence
+        /// before it reaches the end of the audio stream, its response can include multiple final results. Silence
+        /// indicates a point at which the speaker pauses between spoken words or phrases.
+        ///
+        /// Specify a value for the pause interval in the range of 0.0 to 120.0.
+        /// * A value greater than 0 specifies the interval that the service is to use for speech recognition.
+        /// * A value of 0 indicates that the service is to use the default interval. It is equivalent to omitting the
+        /// parameter.
+        ///
+        /// The default pause interval for most languages is 0.8 seconds; the default for Chinese is 0.6 seconds.
+        ///
+        /// See [End of phrase silence
+        /// time](https://cloud.ibm.com/docs/services/speech-to-text?topic=speech-to-text-output#silence_time).
+        /// </summary>
+        public double? EndOfPhraseSilenceTime { get; set; }
+        /// <summary>
+        /// If `true`, directs the service to split the transcript into
+        /// multiple final results based on semantic features of the input, for example, at the conclusion of meaningful
+        /// phrases such as sentences. The service bases its understanding of semantic features on the base language
+        /// model that you use with a request. Custom language models and grammars can also influence how and where the
+        /// service splits a transcript. By default, the service splits transcripts based solely on the pause interval.
+        ///
+        /// See [Split transcript at phrase
+        /// end](https://cloud.ibm.com/docs/services/speech-to-text?topic=speech-to-text-output#split_transcript).
+        /// (optional, default to false)
+        /// </summary>
+        public bool? SplitTranscriptAtPhraseEnd { get; set; }
         #endregion
 
         #region Sessionless - Streaming
@@ -498,6 +527,10 @@ private void SendStart()
                 start["grammar_name"] = GrammarName;
             if (Redaction != null)
                 start["redaction"] = Redaction;
+            if (EndOfPhraseSilenceTime != null)
+                start["end_of_phrase_silence_time"] = EndOfPhraseSilenceTime;
+            if (SplitTranscriptAtPhraseEnd != null)
+                start["split_transcript_at_phrase_end"] = SplitTranscriptAtPhraseEnd;
             start["processing_metrics"] = ProcessingMetrics;
             start["processing_metrics_interval"] = ProcessingMetricsInterval;
 

Original file line number	Diff line number	Diff line change
`@@ -1,5 +1,5 @@`
`1`	`1`	`/**`
`2`		`-* (C) Copyright IBM Corp. 2015, 2019.`
	`2`	`+* (C) Copyright IBM Corp. 2015, 2020.`
`3`	`3`	`*`
`4`	`4`	`* Licensed under the Apache License, Version 2.0 (the "License");`
`5`	`5`	`* you may not use this file except in compliance with the License.`
`@@ -109,6 +109,7 @@ public bool Active`
`109`	`109`	`_service.SmartFormatting = true;`
`110`	`110`	`_service.SpeakerLabels = false;`
`111`	`111`	`_service.WordAlternativesThreshold = null;`
	`112`	`+ _service.EndOfPhraseSilenceTime = null;`
`112`	`113`	`_service.StartListening(OnRecognize, OnRecognizeSpeaker);`
`113`	`114`	`}`
`114`	`115`	`else if (!value && _service.IsListening)`