|
212 | 212 | }
|
213 | 213 | }
|
214 | 214 | },
|
215 |
| - "revision": "20210924", |
| 215 | + "revision": "20210929", |
216 | 216 | "rootUrl": "https://speech.googleapis.com/",
|
217 | 217 | "schemas": {
|
218 | 218 | "ListOperationsResponse": {
|
|
283 | 283 | "description": "The only message returned to the client by the `LongRunningRecognize` method. It contains the result as zero or more sequential `SpeechRecognitionResult` messages. It is included in the `result.response` field of the `Operation` returned by the `GetOperation` call of the `google::longrunning::Operations` service.",
|
284 | 284 | "id": "LongRunningRecognizeResponse",
|
285 | 285 | "properties": {
|
| 286 | + "outputConfig": { |
| 287 | + "$ref": "TranscriptOutputConfig", |
| 288 | + "description": "Original output config if present in the request." |
| 289 | + }, |
| 290 | + "outputError": { |
| 291 | + "$ref": "Status", |
| 292 | + "description": "If the transcript output fails, this field contains the relevant error." |
| 293 | + }, |
286 | 294 | "results": {
|
287 | 295 | "description": "Sequential list of transcription results corresponding to sequential portions of audio.",
|
288 | 296 | "items": {
|
|
384 | 392 | "AMR",
|
385 | 393 | "AMR_WB",
|
386 | 394 | "OGG_OPUS",
|
387 |
| - "SPEEX_WITH_HEADER_BYTE" |
| 395 | + "SPEEX_WITH_HEADER_BYTE", |
| 396 | + "WEBM_OPUS" |
388 | 397 | ],
|
389 | 398 | "enumDescriptions": [
|
390 | 399 | "Not specified.",
|
|
394 | 403 | "Adaptive Multi-Rate Narrowband codec. `sample_rate_hertz` must be 8000.",
|
395 | 404 | "Adaptive Multi-Rate Wideband codec. `sample_rate_hertz` must be 16000.",
|
396 | 405 | "Opus encoded audio frames in Ogg container ([OggOpus](https://wiki.xiph.org/OggOpus)). `sample_rate_hertz` must be one of 8000, 12000, 16000, 24000, or 48000.",
|
397 |
| - "Although the use of lossy encodings is not recommended, if a very low bitrate encoding is required, `OGG_OPUS` is highly preferred over Speex encoding. The [Speex](https://speex.org/) encoding supported by Cloud Speech API has a header byte in each block, as in MIME type `audio/x-speex-with-header-byte`. It is a variant of the RTP Speex encoding defined in [RFC 5574](https://tools.ietf.org/html/rfc5574). The stream is a sequence of blocks, one block per RTP packet. Each block starts with a byte containing the length of the block, in bytes, followed by one or more frames of Speex data, padded to an integral number of bytes (octets) as specified in RFC 5574. In other words, each RTP header is replaced with a single byte containing the block length. Only Speex wideband is supported. `sample_rate_hertz` must be 16000." |
| 406 | + "Although the use of lossy encodings is not recommended, if a very low bitrate encoding is required, `OGG_OPUS` is highly preferred over Speex encoding. The [Speex](https://speex.org/) encoding supported by Cloud Speech API has a header byte in each block, as in MIME type `audio/x-speex-with-header-byte`. It is a variant of the RTP Speex encoding defined in [RFC 5574](https://tools.ietf.org/html/rfc5574). The stream is a sequence of blocks, one block per RTP packet. Each block starts with a byte containing the length of the block, in bytes, followed by one or more frames of Speex data, padded to an integral number of bytes (octets) as specified in RFC 5574. In other words, each RTP header is replaced with a single byte containing the block length. Only Speex wideband is supported. `sample_rate_hertz` must be 16000.", |
| 407 | + "Opus encoded audio frames in WebM container ([OggOpus](https://wiki.xiph.org/OggOpus)). This is a Beta feature and is only available in v1p1beta1. `sample_rate_hertz` must be one of 8000, 12000, 16000, 24000, or 48000." |
398 | 408 | ],
|
399 | 409 | "type": "string"
|
400 | 410 | },
|
|
0 commit comments