lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb in google-cloud-speech-0.34.1 vs lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb in google-cloud-speech-0.35.0
- old
+ new
@@ -319,10 +319,15 @@
# by one or more frames of Speex data, padded to an integral number of
# bytes (octets) as specified in RFC 5574. In other words, each RTP header
# is replaced with a single byte containing the block length. Only Speex
# wideband is supported. `sample_rate_hertz` must be 16000.
SPEEX_WITH_HEADER_BYTE = 7
+
+ # MP3 audio. Support all standard MP3 bitrates (which range from 32-320
+ # kbps). When using this encoding, `sample_rate_hertz` can be optionally
+ # unset if not known.
+ MP3 = 8
end
end
# Description of audio data to be recognized.
# @!attribute [rw] interaction_type
@@ -463,9 +468,25 @@
# the speech recognition is more likely to recognize them. This can be used
# to improve the accuracy for specific words and phrases, for example, if
# specific commands are typically spoken by the user. This can also be used
# to add additional words to the vocabulary of the recognizer. See
# [usage limits](https://cloud.google.com/speech-to-text/quotas#content).
+ #
+ # List items can also be set to classes for groups of words that represent
+ # common concepts that occur in natural language. For example, rather than
+ # providing phrase hints for every month of the year, using the $MONTH class
+ # improves the likelihood of correctly transcribing audio that includes
+ # months.
+ # @!attribute [rw] boost
+ # @return [Float]
+ # Hint Boost. Positive value will increase the probability that a specific
+ # phrase will be recognized over other similar sounding phrases. The higher
+ # the boost, the higher the chance of false positive recognition as well.
+ # Negative boost values would correspond to anti-biasing. Anti-biasing is not
+ # enabled, so negative boost will simply be ignored. Though `boost` can
+ # accept a wide range of positive values, most use cases are best served with
+ # values between 0 and 20. We recommend using a binary search approach to
+ # finding the optimal value for your use case.
class SpeechContext; end
# Contains audio data in the encoding specified in the `RecognitionConfig`.
# Either `content` or `uri` must be supplied. Supplying both or neither
# returns {Google::Rpc::Code::INVALID_ARGUMENT}.
\ No newline at end of file