lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb in google-cloud-speech-0.36.0 vs lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb in google-cloud-speech-0.37.0
- old
+ new
@@ -188,22 +188,27 @@
# @!attribute [rw] enable_speaker_diarization
# @return [true, false]
# *Optional* If 'true', enables speaker detection for each recognized word in
# the top alternative of the recognition result using a speaker_tag provided
# in the WordInfo.
- # Note: When this is true, we send all the words from the beginning of the
+ # Note: Use diarization_config instead.
+ # @!attribute [rw] diarization_speaker_count
+ # @return [Integer]
+ # *Optional*
+ # If set, specifies the estimated number of speakers in the conversation.
+ # Defaults to '2'. Ignored unless enable_speaker_diarization is set to true.
+ # Note: Use diarization_config instead.
+ # @!attribute [rw] diarization_config
+ # @return [Google::Cloud::Speech::V1p1beta1::SpeakerDiarizationConfig]
+ # *Optional* Config to enable speaker diarization and set additional
+ # parameters to make diarization better suited for your application.
+ # Note: When this is enabled, we send all the words from the beginning of the
# audio for the top alternative in every consecutive STREAMING response.
# This is done in order to improve our speaker tags as our models learn to
# identify the speakers in the conversation over time.
# For non-streaming requests, the diarization results will be provided only
# in the top alternative of the FINAL SpeechRecognitionResult.
- # @!attribute [rw] diarization_speaker_count
- # @return [Integer]
- # *Optional*
- # If set, specifies the estimated number of speakers in the conversation.
- # If not set, defaults to '2'.
- # Ignored unless enable_speaker_diarization is set to true.
# @!attribute [rw] metadata
# @return [Google::Cloud::Speech::V1p1beta1::RecognitionMetadata]
# *Optional* Metadata regarding this request.
# @!attribute [rw] model
# @return [String]
@@ -319,9 +324,29 @@
# kbps). When using this encoding, `sample_rate_hertz` can be optionally
# unset if not known.
MP3 = 8
end
end
+
+ # *Optional* Config to enable speaker diarization.
+ # @!attribute [rw] enable_speaker_diarization
+ # @return [true, false]
+ # *Optional* If 'true', enables speaker detection for each recognized word in
+ # the top alternative of the recognition result using a speaker_tag provided
+ # in the WordInfo.
+ # @!attribute [rw] min_speaker_count
+ # @return [Integer]
+ # *Optional*
+ # Minimum number of speakers in the conversation. This range gives you more
+ # flexibility by allowing the system to automatically determine the correct
+ # number of speakers. If not set, the default value is 2.
+ # @!attribute [rw] max_speaker_count
+ # @return [Integer]
+ # *Optional*
+ # Maximum number of speakers in the conversation. This range gives you more
+ # flexibility by allowing the system to automatically determine the correct
+ # number of speakers. If not set, the default value is 6.
+ class SpeakerDiarizationConfig; end
# Description of audio data to be recognized.
# @!attribute [rw] interaction_type
# @return [Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::InteractionType]
# The use case most closely describing the audio content to be recognized.
\ No newline at end of file