lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb in google-cloud-speech-0.36.0 vs lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb in google-cloud-speech-0.37.0

- old
+ new

@@ -188,22 +188,27 @@ # @!attribute [rw] enable_speaker_diarization # @return [true, false] # *Optional* If 'true', enables speaker detection for each recognized word in # the top alternative of the recognition result using a speaker_tag provided # in the WordInfo. - # Note: When this is true, we send all the words from the beginning of the + # Note: Use diarization_config instead. + # @!attribute [rw] diarization_speaker_count + # @return [Integer] + # *Optional* + # If set, specifies the estimated number of speakers in the conversation. + # Defaults to '2'. Ignored unless enable_speaker_diarization is set to true. + # Note: Use diarization_config instead. + # @!attribute [rw] diarization_config + # @return [Google::Cloud::Speech::V1p1beta1::SpeakerDiarizationConfig] + # *Optional* Config to enable speaker diarization and set additional + # parameters to make diarization better suited for your application. + # Note: When this is enabled, we send all the words from the beginning of the # audio for the top alternative in every consecutive STREAMING responses. # This is done in order to improve our speaker tags as our models learn to # identify the speakers in the conversation over time. # For non-streaming requests, the diarization results will be provided only # in the top alternative of the FINAL SpeechRecognitionResult. - # @!attribute [rw] diarization_speaker_count - # @return [Integer] - # *Optional* - # If set, specifies the estimated number of speakers in the conversation. - # If not set, defaults to '2'. - # Ignored unless enable_speaker_diarization is set to true." # @!attribute [rw] metadata # @return [Google::Cloud::Speech::V1p1beta1::RecognitionMetadata] # *Optional* Metadata regarding this request. # @!attribute [rw] model # @return [String] @@ -319,9 +324,29 @@ # kbps). When using this encoding, `sample_rate_hertz` can be optionally # unset if not known. MP3 = 8 end end + + # *Optional* Config to enable speaker diarization. + # @!attribute [rw] enable_speaker_diarization + # @return [true, false] + # *Optional* If 'true', enables speaker detection for each recognized word in + # the top alternative of the recognition result using a speaker_tag provided + # in the WordInfo. + # @!attribute [rw] min_speaker_count + # @return [Integer] + # *Optional* + # Minimum number of speakers in the conversation. This range gives you more + # flexibility by allowing the system to automatically determine the correct + # number of speakers. If not set, the default value is 2. + # @!attribute [rw] max_speaker_count + # @return [Integer] + # *Optional* + # Maximum number of speakers in the conversation. This range gives you more + # flexibility by allowing the system to automatically determine the correct + # number of speakers. If not set, the default value is 6. + class SpeakerDiarizationConfig; end # Description of audio data to be recognized. # @!attribute [rw] interaction_type # @return [Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::InteractionType] # The use case most closely describing the audio content to be recognized. \ No newline at end of file