@@ -218,6 +218,7 @@ def recognize(
218218 end_of_phrase_silence_time : Optional [float ] = None ,
219219 split_transcript_at_phrase_end : Optional [bool ] = None ,
220220 speech_detector_sensitivity : Optional [float ] = None ,
221+ sad_module : Optional [int ] = None ,
221222 background_audio_suppression : Optional [float ] = None ,
222223 low_latency : Optional [bool ] = None ,
223224 character_insertion_bias : Optional [float ] = None ,
@@ -351,8 +352,9 @@ def recognize(
351352 activity is detected in the stream. This can be used both in standard and
352353 low latency mode. This feature enables client applications to know that
353354 some words/speech has been detected and the service is in the process of
354- decoding. This can be used in lieu of interim results in standard mode. See
355- [Using speech recognition
355+ decoding. This can be used in lieu of interim results in standard mode. Use
356+ `sad_module: 2` to increase accuracy and performance in detecting speech
357+ boundaries within the audio stream. See [Using speech recognition
356358 parameters](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-service-features#features-parameters).
357359 :param str language_customization_id: (optional) The customization ID
358360 (GUID) of a custom language model that is to be used with the recognition
@@ -555,6 +557,12 @@ def recognize(
555557 sensitivity](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-detection#detection-parameters-sensitivity)
556558 and [Language model
557559 support](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-detection#detection-support).
560+ :param int sad_module: (optional) Detects speech boundaries within the
561+ audio stream with better performance, improved noise suppression, faster
562+ responsiveness, and increased accuracy.
563+ Specify `sad_module: 2` to use this improved detection.
564+ See [Speech Activity Detection
565+ (SAD)](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-detection#sad).
558566 :param float background_audio_suppression: (optional) The level to which
559567 the service is to suppress background audio based on its volume to prevent
560568 it from being transcribed as speech. Use the parameter to suppress side
@@ -647,6 +655,7 @@ def recognize(
647655 'end_of_phrase_silence_time' : end_of_phrase_silence_time ,
648656 'split_transcript_at_phrase_end' : split_transcript_at_phrase_end ,
649657 'speech_detector_sensitivity' : speech_detector_sensitivity ,
658+ 'sad_module' : sad_module ,
650659 'background_audio_suppression' : background_audio_suppression ,
651660 'low_latency' : low_latency ,
652661 'character_insertion_bias' : character_insertion_bias ,
@@ -845,6 +854,7 @@ def create_job(
845854 end_of_phrase_silence_time : Optional [float ] = None ,
846855 split_transcript_at_phrase_end : Optional [bool ] = None ,
847856 speech_detector_sensitivity : Optional [float ] = None ,
857+ sad_module : Optional [int ] = None ,
848858 background_audio_suppression : Optional [float ] = None ,
849859 low_latency : Optional [bool ] = None ,
850860 character_insertion_bias : Optional [float ] = None ,
@@ -1244,6 +1254,12 @@ def create_job(
12441254 sensitivity](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-detection#detection-parameters-sensitivity)
12451255 and [Language model
12461256 support](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-detection#detection-support).
1257+ :param int sad_module: (optional) Detects speech boundaries within the
1258+ audio stream with better performance, improved noise suppression, faster
1259+ responsiveness, and increased accuracy.
1260+ Specify `sad_module: 2` to use this improved detection.
1261+ See [Speech Activity Detection
1262+ (SAD)](https://cloud.ibm.com/docs/speech-to-text?topic=speech-to-text-detection#sad).
12471263 :param float background_audio_suppression: (optional) The level to which
12481264 the service is to suppress background audio based on its volume to prevent
12491265 it from being transcribed as speech. Use the parameter to suppress side
@@ -1341,6 +1357,7 @@ def create_job(
13411357 'end_of_phrase_silence_time' : end_of_phrase_silence_time ,
13421358 'split_transcript_at_phrase_end' : split_transcript_at_phrase_end ,
13431359 'speech_detector_sensitivity' : speech_detector_sensitivity ,
1360+ 'sad_module' : sad_module ,
13441361 'background_audio_suppression' : background_audio_suppression ,
13451362 'low_latency' : low_latency ,
13461363 'character_insertion_bias' : character_insertion_bias ,
0 commit comments