From e496559c17e00a1fb3989c6c38cb87a0453c5b29 Mon Sep 17 00:00:00 2001
From: Yoshi Automation Bot <yoshi-automation@google.com>
Date: Tue, 27 Apr 2021 12:10:16 -0700
Subject: [PATCH] feat: add webm opus support (#500)

This PR was generated using Autosynth. :rainbow:

Synth log will be available here:
https://source.cloud.google.com/results/invocations/c65c7773-dbef-42eb-b70e-47092f05bd1b/targets

- [ ] To automatically regenerate this PR, check this box. (May take up to 24 hours.)

PiperOrigin-RevId: 370523741
Source-Link: https://github.com/googleapis/googleapis/commit/36a84fe3eaf841f56c4b6683d1c0403f7b503092
---
 .../speech/v1p1beta1/RecognitionConfig.java   |  42 +++-
 .../v1p1beta1/RecognitionConfigOrBuilder.java |   4 +-
 .../cloud/speech/v1p1beta1/SpeechProto.java   | 191 +++++++++---------
 .../cloud/speech/v1p1beta1/cloud_speech.proto |   9 +-
 synth.metadata                                |  10 +-
 5 files changed, 145 insertions(+), 111 deletions(-)
diff --git a/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/RecognitionConfig.java b/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/RecognitionConfig.java
index 6a6aec931..1799127be 100644
--- a/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/RecognitionConfig.java
+++ b/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/RecognitionConfig.java
@@ -435,6 +435,19 @@ public enum AudioEncoding implements com.google.protobuf.ProtocolMessageEnum {
      * <code>MP3 = 8;</code>
      */
     MP3(8),
+    /**
+     *
+     *
+     * <pre>
+     * Opus encoded audio frames in a WebM container
+     * ([OggOpus](https://wiki.xiph.org/OggOpus)). This is a Beta feature and
+     * only available in v1p1beta1. `sample_rate_hertz` must be one of 8000,
+     * 12000, 16000, 24000, or 48000.
+     * </pre>
+     *
+     * <code>WEBM_OPUS = 9;</code>
+     */
+    WEBM_OPUS(9),
     UNRECOGNIZED(-1),
     ;
 
@@ -550,6 +563,19 @@ public enum AudioEncoding implements com.google.protobuf.ProtocolMessageEnum {
      * <code>MP3 = 8;</code>
      */
     public static final int MP3_VALUE = 8;
+    /**
+     *
+     *
+     * <pre>
+     * Opus encoded audio frames in a WebM container
+     * ([OggOpus](https://wiki.xiph.org/OggOpus)). This is a Beta feature and
+     * only available in v1p1beta1. `sample_rate_hertz` must be one of 8000,
+     * 12000, 16000, 24000, or 48000.
+     * </pre>
+     *
+     * <code>WEBM_OPUS = 9;</code>
+     */
+    public static final int WEBM_OPUS_VALUE = 9;
 
     public final int getNumber() {
       if (this == UNRECOGNIZED) {
@@ -593,6 +619,8 @@ public static AudioEncoding forNumber(int value) {
           return SPEEX_WITH_HEADER_BYTE;
         case 8:
           return MP3;
+        case 9:
+          return WEBM_OPUS;
         default:
           return null;
       }
@@ -1496,7 +1524,7 @@ public com.google.cloud.speech.v1p1beta1.RecognitionMetadataOrBuilder getMetadat
    *   &lt;/tr&gt;
    *   &lt;tr&gt;
    *     &lt;td&gt;&lt;code&gt;video&lt;/code&gt;&lt;/td&gt;
-   *     &lt;td&gt;Best for audio that originated from from video or includes multiple
+   *     &lt;td&gt;Best for audio that originated from video or includes multiple
    *         speakers. Ideally the audio is recorded at a 16khz or greater
    *         sampling rate. This is a premium model that costs more than the
    *         standard rate.&lt;/td&gt;
@@ -1550,7 +1578,7 @@ public java.lang.String getModel() {
    *   &lt;/tr&gt;
    *   &lt;tr&gt;
    *     &lt;td&gt;&lt;code&gt;video&lt;/code&gt;&lt;/td&gt;
-   *     &lt;td&gt;Best for audio that originated from from video or includes multiple
+   *     &lt;td&gt;Best for audio that originated from video or includes multiple
    *         speakers. Ideally the audio is recorded at a 16khz or greater
    *         sampling rate. This is a premium model that costs more than the
    *         standard rate.&lt;/td&gt;
@@ -5094,7 +5122,7 @@ public com.google.cloud.speech.v1p1beta1.RecognitionMetadataOrBuilder getMetadat
      *   &lt;/tr&gt;
      *   &lt;tr&gt;
      *     &lt;td&gt;&lt;code&gt;video&lt;/code&gt;&lt;/td&gt;
-     *     &lt;td&gt;Best for audio that originated from from video or includes multiple
+     *     &lt;td&gt;Best for audio that originated from video or includes multiple
      *         speakers. Ideally the audio is recorded at a 16khz or greater
      *         sampling rate. This is a premium model that costs more than the
      *         standard rate.&lt;/td&gt;
@@ -5147,7 +5175,7 @@ public java.lang.String getModel() {
      *   &lt;/tr&gt;
      *   &lt;tr&gt;
      *     &lt;td&gt;&lt;code&gt;video&lt;/code&gt;&lt;/td&gt;
-     *     &lt;td&gt;Best for audio that originated from from video or includes multiple
+     *     &lt;td&gt;Best for audio that originated from video or includes multiple
      *         speakers. Ideally the audio is recorded at a 16khz or greater
      *         sampling rate. This is a premium model that costs more than the
      *         standard rate.&lt;/td&gt;
@@ -5200,7 +5228,7 @@ public com.google.protobuf.ByteString getModelBytes() {
      *   &lt;/tr&gt;
      *   &lt;tr&gt;
      *     &lt;td&gt;&lt;code&gt;video&lt;/code&gt;&lt;/td&gt;
-     *     &lt;td&gt;Best for audio that originated from from video or includes multiple
+     *     &lt;td&gt;Best for audio that originated from video or includes multiple
      *         speakers. Ideally the audio is recorded at a 16khz or greater
      *         sampling rate. This is a premium model that costs more than the
      *         standard rate.&lt;/td&gt;
@@ -5252,7 +5280,7 @@ public Builder setModel(java.lang.String value) {
      *   &lt;/tr&gt;
      *   &lt;tr&gt;
      *     &lt;td&gt;&lt;code&gt;video&lt;/code&gt;&lt;/td&gt;
-     *     &lt;td&gt;Best for audio that originated from from video or includes multiple
+     *     &lt;td&gt;Best for audio that originated from video or includes multiple
      *         speakers. Ideally the audio is recorded at a 16khz or greater
      *         sampling rate. This is a premium model that costs more than the
      *         standard rate.&lt;/td&gt;
@@ -5300,7 +5328,7 @@ public Builder clearModel() {
      *   &lt;/tr&gt;
      *   &lt;tr&gt;
      *     &lt;td&gt;&lt;code&gt;video&lt;/code&gt;&lt;/td&gt;
-     *     &lt;td&gt;Best for audio that originated from from video or includes multiple
+     *     &lt;td&gt;Best for audio that originated from video or includes multiple
      *         speakers. Ideally the audio is recorded at a 16khz or greater
      *         sampling rate. This is a premium model that costs more than the
      *         standard rate.&lt;/td&gt;
diff --git a/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/RecognitionConfigOrBuilder.java b/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/RecognitionConfigOrBuilder.java
index 2502f4b4f..99350d004 100644
--- a/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/RecognitionConfigOrBuilder.java
+++ b/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/RecognitionConfigOrBuilder.java
@@ -689,7 +689,7 @@ public interface RecognitionConfigOrBuilder
    *   &lt;/tr&gt;
    *   &lt;tr&gt;
    *     &lt;td&gt;&lt;code&gt;video&lt;/code&gt;&lt;/td&gt;
-   *     &lt;td&gt;Best for audio that originated from from video or includes multiple
+   *     &lt;td&gt;Best for audio that originated from video or includes multiple
    *         speakers. Ideally the audio is recorded at a 16khz or greater
    *         sampling rate. This is a premium model that costs more than the
    *         standard rate.&lt;/td&gt;
@@ -732,7 +732,7 @@ public interface RecognitionConfigOrBuilder
    *   &lt;/tr&gt;
    *   &lt;tr&gt;
    *     &lt;td&gt;&lt;code&gt;video&lt;/code&gt;&lt;/td&gt;
-   *     &lt;td&gt;Best for audio that originated from from video or includes multiple
+   *     &lt;td&gt;Best for audio that originated from video or includes multiple
    *         speakers. Ideally the audio is recorded at a 16khz or greater
    *         sampling rate. This is a premium model that costs more than the
    *         standard rate.&lt;/td&gt;
diff --git a/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/SpeechProto.java b/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/SpeechProto.java
index 41f71dbcd..18d17f440 100644
--- a/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/SpeechProto.java
+++ b/proto-google-cloud-speech-v1p1beta1/src/main/java/com/google/cloud/speech/v1p1beta1/SpeechProto.java
@@ -137,7 +137,7 @@ public static com.google.protobuf.Descriptors.FileDescriptor getDescriptor() {
           + "\"\226\001\n\032StreamingRecognitionConfig\022E\n\006confi"
           + "g\030\001 \001(\01320.google.cloud.speech.v1p1beta1."
           + "RecognitionConfigB\003\340A\002\022\030\n\020single_utteran"
-          + "ce\030\002 \001(\010\022\027\n\017interim_results\030\003 \001(\010\"\325\010\n\021Re"
+          + "ce\030\002 \001(\010\022\027\n\017interim_results\030\003 \001(\010\"\344\010\n\021Re"
           + "cognitionConfig\022P\n\010encoding\030\001 \001(\0162>.goog"
           + "le.cloud.speech.v1p1beta1.RecognitionCon"
           + "fig.AudioEncoding\022\031\n\021sample_rate_hertz\030\002"
@@ -161,105 +161,106 @@ public static com.google.protobuf.Descriptors.FileDescriptor getDescriptor() {
           + "cloud.speech.v1p1beta1.SpeakerDiarizatio"
           + "nConfig\022D\n\010metadata\030\t \001(\01322.google.cloud"
           + ".speech.v1p1beta1.RecognitionMetadata\022\r\n"
-          + "\005model\030\r \001(\t\022\024\n\014use_enhanced\030\016 \001(\010\"\224\001\n\rA"
+          + "\005model\030\r \001(\t\022\024\n\014use_enhanced\030\016 \001(\010\"\243\001\n\rA"
           + "udioEncoding\022\030\n\024ENCODING_UNSPECIFIED\020\000\022\014"
           + "\n\010LINEAR16\020\001\022\010\n\004FLAC\020\002\022\t\n\005MULAW\020\003\022\007\n\003AMR"
           + "\020\004\022\n\n\006AMR_WB\020\005\022\014\n\010OGG_OPUS\020\006\022\032\n\026SPEEX_WI"
-          + "TH_HEADER_BYTE\020\007\022\007\n\003MP3\020\010\"\220\001\n\030SpeakerDia"
-          + "rizationConfig\022\"\n\032enable_speaker_diariza"
-          + "tion\030\001 \001(\010\022\031\n\021min_speaker_count\030\002 \001(\005\022\031\n"
-          + "\021max_speaker_count\030\003 \001(\005\022\032\n\013speaker_tag\030"
-          + "\005 \001(\005B\005\030\001\340A\003\"\327\010\n\023RecognitionMetadata\022\\\n\020"
-          + "interaction_type\030\001 \001(\0162B.google.cloud.sp"
-          + "eech.v1p1beta1.RecognitionMetadata.Inter"
-          + "actionType\022$\n\034industry_naics_code_of_aud"
-          + "io\030\003 \001(\r\022b\n\023microphone_distance\030\004 \001(\0162E."
+          + "TH_HEADER_BYTE\020\007\022\007\n\003MP3\020\010\022\r\n\tWEBM_OPUS\020\t"
+          + "\"\220\001\n\030SpeakerDiarizationConfig\022\"\n\032enable_"
+          + "speaker_diarization\030\001 \001(\010\022\031\n\021min_speaker"
+          + "_count\030\002 \001(\005\022\031\n\021max_speaker_count\030\003 \001(\005\022"
+          + "\032\n\013speaker_tag\030\005 \001(\005B\005\030\001\340A\003\"\327\010\n\023Recognit"
+          + "ionMetadata\022\\\n\020interaction_type\030\001 \001(\0162B."
           + "google.cloud.speech.v1p1beta1.Recognitio"
-          + "nMetadata.MicrophoneDistance\022a\n\023original"
-          + "_media_type\030\005 \001(\0162D.google.cloud.speech."
-          + "v1p1beta1.RecognitionMetadata.OriginalMe"
-          + "diaType\022e\n\025recording_device_type\030\006 \001(\0162F"
-          + ".google.cloud.speech.v1p1beta1.Recogniti"
-          + "onMetadata.RecordingDeviceType\022\035\n\025record"
-          + "ing_device_name\030\007 \001(\t\022\032\n\022original_mime_t"
-          + "ype\030\010 \001(\t\022\031\n\robfuscated_id\030\t \001(\003B\002\030\001\022\023\n\013"
-          + "audio_topic\030\n \001(\t\"\305\001\n\017InteractionType\022 \n"
-          + "\034INTERACTION_TYPE_UNSPECIFIED\020\000\022\016\n\nDISCU"
-          + "SSION\020\001\022\020\n\014PRESENTATION\020\002\022\016\n\nPHONE_CALL\020"
-          + "\003\022\r\n\tVOICEMAIL\020\004\022\033\n\027PROFESSIONALLY_PRODU"
-          + "CED\020\005\022\020\n\014VOICE_SEARCH\020\006\022\021\n\rVOICE_COMMAND"
-          + "\020\007\022\r\n\tDICTATION\020\010\"d\n\022MicrophoneDistance\022"
-          + "#\n\037MICROPHONE_DISTANCE_UNSPECIFIED\020\000\022\r\n\t"
-          + "NEARFIELD\020\001\022\014\n\010MIDFIELD\020\002\022\014\n\010FARFIELD\020\003\""
-          + "N\n\021OriginalMediaType\022#\n\037ORIGINAL_MEDIA_T"
-          + "YPE_UNSPECIFIED\020\000\022\t\n\005AUDIO\020\001\022\t\n\005VIDEO\020\002\""
-          + "\244\001\n\023RecordingDeviceType\022%\n!RECORDING_DEV"
-          + "ICE_TYPE_UNSPECIFIED\020\000\022\016\n\nSMARTPHONE\020\001\022\006"
-          + "\n\002PC\020\002\022\016\n\nPHONE_LINE\020\003\022\013\n\007VEHICLE\020\004\022\030\n\024O"
-          + "THER_OUTDOOR_DEVICE\020\005\022\027\n\023OTHER_INDOOR_DE"
-          + "VICE\020\006\"/\n\rSpeechContext\022\017\n\007phrases\030\001 \003(\t"
-          + "\022\r\n\005boost\030\004 \001(\002\"D\n\020RecognitionAudio\022\021\n\007c"
-          + "ontent\030\001 \001(\014H\000\022\r\n\003uri\030\002 \001(\tH\000B\016\n\014audio_s"
-          + "ource\"\\\n\021RecognizeResponse\022G\n\007results\030\002 "
-          + "\003(\01326.google.cloud.speech.v1p1beta1.Spee"
-          + "chRecognitionResult\"\337\001\n\034LongRunningRecog"
-          + "nizeResponse\022G\n\007results\030\002 \003(\01326.google.c"
-          + "loud.speech.v1p1beta1.SpeechRecognitionR"
-          + "esult\022L\n\routput_config\030\006 \001(\01325.google.cl"
-          + "oud.speech.v1p1beta1.TranscriptOutputCon"
-          + "fig\022(\n\014output_error\030\007 \001(\0132\022.google.rpc.S"
-          + "tatus\"\203\002\n\034LongRunningRecognizeMetadata\022\030"
-          + "\n\020progress_percent\030\001 \001(\005\022.\n\nstart_time\030\002"
-          + " \001(\0132\032.google.protobuf.Timestamp\0224\n\020last"
-          + "_update_time\030\003 \001(\0132\032.google.protobuf.Tim"
-          + "estamp\022\020\n\003uri\030\004 \001(\tB\003\340A\003\022Q\n\routput_confi"
-          + "g\030\005 \001(\01325.google.cloud.speech.v1p1beta1."
-          + "TranscriptOutputConfigB\003\340A\003\"\277\002\n\032Streamin"
-          + "gRecognizeResponse\022!\n\005error\030\001 \001(\0132\022.goog"
-          + "le.rpc.Status\022J\n\007results\030\002 \003(\01329.google."
-          + "cloud.speech.v1p1beta1.StreamingRecognit"
-          + "ionResult\022d\n\021speech_event_type\030\004 \001(\0162I.g"
+          + "nMetadata.InteractionType\022$\n\034industry_na"
+          + "ics_code_of_audio\030\003 \001(\r\022b\n\023microphone_di"
+          + "stance\030\004 \001(\0162E.google.cloud.speech.v1p1b"
+          + "eta1.RecognitionMetadata.MicrophoneDista"
+          + "nce\022a\n\023original_media_type\030\005 \001(\0162D.googl"
+          + "e.cloud.speech.v1p1beta1.RecognitionMeta"
+          + "data.OriginalMediaType\022e\n\025recording_devi"
+          + "ce_type\030\006 \001(\0162F.google.cloud.speech.v1p1"
+          + "beta1.RecognitionMetadata.RecordingDevic"
+          + "eType\022\035\n\025recording_device_name\030\007 \001(\t\022\032\n\022"
+          + "original_mime_type\030\010 \001(\t\022\031\n\robfuscated_i"
+          + "d\030\t \001(\003B\002\030\001\022\023\n\013audio_topic\030\n \001(\t\"\305\001\n\017Int"
+          + "eractionType\022 \n\034INTERACTION_TYPE_UNSPECI"
+          + "FIED\020\000\022\016\n\nDISCUSSION\020\001\022\020\n\014PRESENTATION\020\002"
+          + "\022\016\n\nPHONE_CALL\020\003\022\r\n\tVOICEMAIL\020\004\022\033\n\027PROFE"
+          + "SSIONALLY_PRODUCED\020\005\022\020\n\014VOICE_SEARCH\020\006\022\021"
+          + "\n\rVOICE_COMMAND\020\007\022\r\n\tDICTATION\020\010\"d\n\022Micr"
+          + "ophoneDistance\022#\n\037MICROPHONE_DISTANCE_UN"
+          + "SPECIFIED\020\000\022\r\n\tNEARFIELD\020\001\022\014\n\010MIDFIELD\020\002"
+          + "\022\014\n\010FARFIELD\020\003\"N\n\021OriginalMediaType\022#\n\037O"
+          + "RIGINAL_MEDIA_TYPE_UNSPECIFIED\020\000\022\t\n\005AUDI"
+          + "O\020\001\022\t\n\005VIDEO\020\002\"\244\001\n\023RecordingDeviceType\022%"
+          + "\n!RECORDING_DEVICE_TYPE_UNSPECIFIED\020\000\022\016\n"
+          + "\nSMARTPHONE\020\001\022\006\n\002PC\020\002\022\016\n\nPHONE_LINE\020\003\022\013\n"
+          + "\007VEHICLE\020\004\022\030\n\024OTHER_OUTDOOR_DEVICE\020\005\022\027\n\023"
+          + "OTHER_INDOOR_DEVICE\020\006\"/\n\rSpeechContext\022\017"
+          + "\n\007phrases\030\001 \003(\t\022\r\n\005boost\030\004 \001(\002\"D\n\020Recogn"
+          + "itionAudio\022\021\n\007content\030\001 \001(\014H\000\022\r\n\003uri\030\002 \001"
+          + "(\tH\000B\016\n\014audio_source\"\\\n\021RecognizeRespons"
+          + "e\022G\n\007results\030\002 \003(\01326.google.cloud.speech"
+          + ".v1p1beta1.SpeechRecognitionResult\"\337\001\n\034L"
+          + "ongRunningRecognizeResponse\022G\n\007results\030\002"
+          + " \003(\01326.google.cloud.speech.v1p1beta1.Spe"
+          + "echRecognitionResult\022L\n\routput_config\030\006 "
+          + "\001(\01325.google.cloud.speech.v1p1beta1.Tran"
+          + "scriptOutputConfig\022(\n\014output_error\030\007 \001(\013"
+          + "2\022.google.rpc.Status\"\203\002\n\034LongRunningReco"
+          + "gnizeMetadata\022\030\n\020progress_percent\030\001 \001(\005\022"
+          + ".\n\nstart_time\030\002 \001(\0132\032.google.protobuf.Ti"
+          + "mestamp\0224\n\020last_update_time\030\003 \001(\0132\032.goog"
+          + "le.protobuf.Timestamp\022\020\n\003uri\030\004 \001(\tB\003\340A\003\022"
+          + "Q\n\routput_config\030\005 \001(\01325.google.cloud.sp"
+          + "eech.v1p1beta1.TranscriptOutputConfigB\003\340"
+          + "A\003\"\277\002\n\032StreamingRecognizeResponse\022!\n\005err"
+          + "or\030\001 \001(\0132\022.google.rpc.Status\022J\n\007results\030"
+          + "\002 \003(\01329.google.cloud.speech.v1p1beta1.St"
+          + "reamingRecognitionResult\022d\n\021speech_event"
+          + "_type\030\004 \001(\0162I.google.cloud.speech.v1p1be"
+          + "ta1.StreamingRecognizeResponse.SpeechEve"
+          + "ntType\"L\n\017SpeechEventType\022\034\n\030SPEECH_EVEN"
+          + "T_UNSPECIFIED\020\000\022\033\n\027END_OF_SINGLE_UTTERAN"
+          + "CE\020\001\"\371\001\n\032StreamingRecognitionResult\022Q\n\014a"
+          + "lternatives\030\001 \003(\0132;.google.cloud.speech."
+          + "v1p1beta1.SpeechRecognitionAlternative\022\020"
+          + "\n\010is_final\030\002 \001(\010\022\021\n\tstability\030\003 \001(\002\0222\n\017r"
+          + "esult_end_time\030\004 \001(\0132\031.google.protobuf.D"
+          + "uration\022\023\n\013channel_tag\030\005 \001(\005\022\032\n\rlanguage"
+          + "_code\030\006 \001(\tB\003\340A\003\"\235\001\n\027SpeechRecognitionRe"
+          + "sult\022Q\n\014alternatives\030\001 \003(\0132;.google.clou"
+          + "d.speech.v1p1beta1.SpeechRecognitionAlte"
+          + "rnative\022\023\n\013channel_tag\030\002 \001(\005\022\032\n\rlanguage"
+          + "_code\030\005 \001(\tB\003\340A\003\"~\n\034SpeechRecognitionAlt"
+          + "ernative\022\022\n\ntranscript\030\001 \001(\t\022\022\n\nconfiden"
+          + "ce\030\002 \001(\002\0226\n\005words\030\003 \003(\0132\'.google.cloud.s"
+          + "peech.v1p1beta1.WordInfo\"\242\001\n\010WordInfo\022-\n"
+          + "\nstart_time\030\001 \001(\0132\031.google.protobuf.Dura"
+          + "tion\022+\n\010end_time\030\002 \001(\0132\031.google.protobuf"
+          + ".Duration\022\014\n\004word\030\003 \001(\t\022\022\n\nconfidence\030\004 "
+          + "\001(\002\022\030\n\013speaker_tag\030\005 \001(\005B\003\340A\0032\202\005\n\006Speech"
+          + "\022\245\001\n\tRecognize\022/.google.cloud.speech.v1p"
+          + "1beta1.RecognizeRequest\0320.google.cloud.s"
+          + "peech.v1p1beta1.RecognizeResponse\"5\202\323\344\223\002"
+          + " \"\033/v1p1beta1/speech:recognize:\001*\332A\014conf"
+          + "ig,audio\022\362\001\n\024LongRunningRecognize\022:.goog"
+          + "le.cloud.speech.v1p1beta1.LongRunningRec"
+          + "ognizeRequest\032\035.google.longrunning.Opera"
+          + "tion\"\177\202\323\344\223\002+\"&/v1p1beta1/speech:longrunn"
+          + "ingrecognize:\001*\332A\014config,audio\312A<\n\034LongR"
+          + "unningRecognizeResponse\022\034LongRunningReco"
+          + "gnizeMetadata\022\217\001\n\022StreamingRecognize\0228.g"
           + "oogle.cloud.speech.v1p1beta1.StreamingRe"
-          + "cognizeResponse.SpeechEventType\"L\n\017Speec"
-          + "hEventType\022\034\n\030SPEECH_EVENT_UNSPECIFIED\020\000"
-          + "\022\033\n\027END_OF_SINGLE_UTTERANCE\020\001\"\371\001\n\032Stream"
-          + "ingRecognitionResult\022Q\n\014alternatives\030\001 \003"
-          + "(\0132;.google.cloud.speech.v1p1beta1.Speec"
-          + "hRecognitionAlternative\022\020\n\010is_final\030\002 \001("
-          + "\010\022\021\n\tstability\030\003 \001(\002\0222\n\017result_end_time\030"
-          + "\004 \001(\0132\031.google.protobuf.Duration\022\023\n\013chan"
-          + "nel_tag\030\005 \001(\005\022\032\n\rlanguage_code\030\006 \001(\tB\003\340A"
-          + "\003\"\235\001\n\027SpeechRecognitionResult\022Q\n\014alterna"
-          + "tives\030\001 \003(\0132;.google.cloud.speech.v1p1be"
-          + "ta1.SpeechRecognitionAlternative\022\023\n\013chan"
-          + "nel_tag\030\002 \001(\005\022\032\n\rlanguage_code\030\005 \001(\tB\003\340A"
-          + "\003\"~\n\034SpeechRecognitionAlternative\022\022\n\ntra"
-          + "nscript\030\001 \001(\t\022\022\n\nconfidence\030\002 \001(\002\0226\n\005wor"
-          + "ds\030\003 \003(\0132\'.google.cloud.speech.v1p1beta1"
-          + ".WordInfo\"\242\001\n\010WordInfo\022-\n\nstart_time\030\001 \001"
-          + "(\0132\031.google.protobuf.Duration\022+\n\010end_tim"
-          + "e\030\002 \001(\0132\031.google.protobuf.Duration\022\014\n\004wo"
-          + "rd\030\003 \001(\t\022\022\n\nconfidence\030\004 \001(\002\022\030\n\013speaker_"
-          + "tag\030\005 \001(\005B\003\340A\0032\202\005\n\006Speech\022\245\001\n\tRecognize\022"
-          + "/.google.cloud.speech.v1p1beta1.Recogniz"
-          + "eRequest\0320.google.cloud.speech.v1p1beta1"
-          + ".RecognizeResponse\"5\202\323\344\223\002 \"\033/v1p1beta1/s"
-          + "peech:recognize:\001*\332A\014config,audio\022\362\001\n\024Lo"
-          + "ngRunningRecognize\022:.google.cloud.speech"
-          + ".v1p1beta1.LongRunningRecognizeRequest\032\035"
-          + ".google.longrunning.Operation\"\177\202\323\344\223\002+\"&/"
-          + "v1p1beta1/speech:longrunningrecognize:\001*"
-          + "\332A\014config,audio\312A<\n\034LongRunningRecognize"
-          + "Response\022\034LongRunningRecognizeMetadata\022\217"
-          + "\001\n\022StreamingRecognize\0228.google.cloud.spe"
-          + "ech.v1p1beta1.StreamingRecognizeRequest\032"
-          + "9.google.cloud.speech.v1p1beta1.Streamin"
-          + "gRecognizeResponse\"\000(\0010\001\032I\312A\025speech.goog"
-          + "leapis.com\322A.https://www.googleapis.com/"
-          + "auth/cloud-platformB\200\001\n!com.google.cloud"
-          + ".speech.v1p1beta1B\013SpeechProtoP\001ZCgoogle"
-          + ".golang.org/genproto/googleapis/cloud/sp"
-          + "eech/v1p1beta1;speech\370\001\001\242\002\003GCSb\006proto3"
+          + "cognizeRequest\0329.google.cloud.speech.v1p"
+          + "1beta1.StreamingRecognizeResponse\"\000(\0010\001\032"
+          + "I\312A\025speech.googleapis.com\322A.https://www."
+          + "googleapis.com/auth/cloud-platformB\200\001\n!c"
+          + "om.google.cloud.speech.v1p1beta1B\013Speech"
+          + "ProtoP\001ZCgoogle.golang.org/genproto/goog"
+          + "leapis/cloud/speech/v1p1beta1;speech\370\001\001\242"
+          + "\002\003GCSb\006proto3"
     };
     descriptor =
         com.google.protobuf.Descriptors.FileDescriptor.internalBuildGeneratedFileFrom(
diff --git a/proto-google-cloud-speech-v1p1beta1/src/main/proto/google/cloud/speech/v1p1beta1/cloud_speech.proto b/proto-google-cloud-speech-v1p1beta1/src/main/proto/google/cloud/speech/v1p1beta1/cloud_speech.proto
index cf183d012..1deb3c7cf 100644
--- a/proto-google-cloud-speech-v1p1beta1/src/main/proto/google/cloud/speech/v1p1beta1/cloud_speech.proto
+++ b/proto-google-cloud-speech-v1p1beta1/src/main/proto/google/cloud/speech/v1p1beta1/cloud_speech.proto
@@ -1,4 +1,3 @@
-
 // Copyright 2021 Google LLC
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
@@ -244,6 +243,12 @@ message RecognitionConfig {
     // kbps). When using this encoding, `sample_rate_hertz` has to match the
     // sample rate of the file being used.
     MP3 = 8;
+
+    // Opus encoded audio frames in a WebM container
+    // ([OggOpus](https://wiki.xiph.org/OggOpus)). This is a Beta feature and
+    // only available in v1p1beta1. `sample_rate_hertz` must be one of 8000,
+    // 12000, 16000, 24000, or 48000.
+    WEBM_OPUS = 9;
   }
 
   // Encoding of audio data sent in all `RecognitionAudio` messages.
@@ -406,7 +411,7 @@ message RecognitionConfig {
   //   </tr>
   //   <tr>
   //     <td><code>video</code></td>
-  //     <td>Best for audio that originated from from video or includes multiple
+  //     <td>Best for audio that originated from video or includes multiple
   //         speakers. Ideally the audio is recorded at a 16khz or greater
   //         sampling rate. This is a premium model that costs more than the
   //         standard rate.</td>
diff --git a/synth.metadata b/synth.metadata
index 2c754a4d9..84e1e5825 100644
--- a/synth.metadata
+++ b/synth.metadata
@@ -4,23 +4,23 @@
       "git": {
         "name": ".",
         "remote": "https://github.com/googleapis/java-speech.git",
-        "sha": "c812cb7783186186061f01fa65c752162df8dc81"
+        "sha": "4530ef98a4d5dbe9def59fdd26c6e2ee37041763"
       }
     },
     {
       "git": {
         "name": "googleapis",
         "remote": "https://github.com/googleapis/googleapis.git",
-        "sha": "93b078ae0decd51e618041bb337a8d592d0c998b",
-        "internalRef": "367239272"
+        "sha": "36a84fe3eaf841f56c4b6683d1c0403f7b503092",
+        "internalRef": "370523741"
       }
     },
     {
       "git": {
         "name": "googleapis",
         "remote": "https://github.com/googleapis/googleapis.git",
-        "sha": "93b078ae0decd51e618041bb337a8d592d0c998b",
-        "internalRef": "367239272"
+        "sha": "36a84fe3eaf841f56c4b6683d1c0403f7b503092",
+        "internalRef": "370523741"
       }
     },
     {