@@ -32,7 +32,9 @@ export interface Session {
32
32
id ?: string ;
33
33
34
34
/**
35
- * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
35
+ * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`. For
36
+ * `pcm16`, input audio must be 16-bit PCM at a 24kHz sample rate, single channel
37
+ * (mono), and little-endian byte order.
36
38
*/
37
39
input_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
38
40
@@ -86,6 +88,7 @@ export interface Session {
86
88
87
89
/**
88
90
* The format of output audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
91
+ * For `pcm16`, output audio is sampled at a rate of 24kHz.
89
92
*/
90
93
output_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
91
94
@@ -372,17 +375,9 @@ export namespace SessionCreateResponse {
372
375
373
376
export interface SessionCreateParams {
374
377
/**
375
- * The Realtime model used for this session.
376
- */
377
- model :
378
- | 'gpt-4o-realtime-preview'
379
- | 'gpt-4o-realtime-preview-2024-10-01'
380
- | 'gpt-4o-realtime-preview-2024-12-17'
381
- | 'gpt-4o-mini-realtime-preview'
382
- | 'gpt-4o-mini-realtime-preview-2024-12-17' ;
383
-
384
- /**
385
- * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
378
+ * The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`. For
379
+ * `pcm16`, input audio must be 16-bit PCM at a 24kHz sample rate, single channel
380
+ * (mono), and little-endian byte order.
386
381
*/
387
382
input_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
388
383
@@ -423,8 +418,19 @@ export interface SessionCreateParams {
423
418
*/
424
419
modalities ?: Array < 'text' | 'audio' > ;
425
420
421
+ /**
422
+ * The Realtime model used for this session.
423
+ */
424
+ model ?:
425
+ | 'gpt-4o-realtime-preview'
426
+ | 'gpt-4o-realtime-preview-2024-10-01'
427
+ | 'gpt-4o-realtime-preview-2024-12-17'
428
+ | 'gpt-4o-mini-realtime-preview'
429
+ | 'gpt-4o-mini-realtime-preview-2024-12-17' ;
430
+
426
431
/**
427
432
* The format of output audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
433
+ * For `pcm16`, output audio is sampled at a rate of 24kHz.
428
434
*/
429
435
output_audio_format ?: 'pcm16' | 'g711_ulaw' | 'g711_alaw' ;
430
436
0 commit comments