googleapis
diff --git a/‎packages/google-cloud-texttospeech/protos/google/cloud/texttospeech/v1beta1/cloud_tts.proto‎
Lines changed: 20 additions & 0 deletions b/‎packages/google-cloud-texttospeech/protos/google/cloud/texttospeech/v1beta1/cloud_tts.proto‎
Lines changed: 20 additions & 0 deletions
diff --git a/‎packages/google-cloud-texttospeech/protos/protos.d.ts‎
Lines changed: 111 additions & 1 deletion b/‎packages/google-cloud-texttospeech/protos/protos.d.ts‎
Lines changed: 111 additions & 1 deletion
@@ -115,6 +115,11 @@ enum AudioEncoding {
   // 8-bit samples that compand 14-bit audio samples using G.711 PCMA/A-law.
   // Audio content returned as ALAW also contains a WAV header.
   ALAW = 6;
+
+  // Uncompressed 16-bit signed little-endian samples (Linear PCM).
+  // Note that as opposed to LINEAR16, audio will not be wrapped in a WAV (or
+  // any other) header.
+  PCM = 7;
 }
 
 // The top-level message sent by the client for the `ListVoices` method.
@@ -432,10 +437,25 @@ message Timepoint {
   double time_seconds = 3;
 }
 
+// Describes the output audio format requested for streaming synthesis.
+message StreamingAudioConfig {
+  // Required. The encoding of the returned audio byte stream.
+  // Streaming currently supports only the PCM and OGG_OPUS encodings; any
+  // other AudioEncoding value will return an error.
+  AudioEncoding audio_encoding = 1 [(google.api.field_behavior) = REQUIRED];
+
+  // Optional. The synthesis sample rate, in hertz, of the returned audio.
+  int32 sample_rate_hertz = 2 [(google.api.field_behavior) = OPTIONAL];
+}
+
 // Configuration for a StreamingSynthesize request.
 message StreamingSynthesizeConfig {
   // Required. The voice to use for the synthesized audio.
   VoiceSelectionParams voice = 1 [(google.api.field_behavior) = REQUIRED];
+
+  // Optional. The output audio format (encoding and sample rate) to produce.
+  StreamingAudioConfig streaming_audio_config = 4
+      [(google.api.field_behavior) = OPTIONAL];
 }
 
 // Input to be synthesized.