You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
"The websockets package is required for realtime speech-to-text. "
@@ -17,10 +20,13 @@
17
20
18
21
class AudioFormat(str, Enum):
19
22
"""Audio format options for realtime transcription"""
23
+
PCM_8000="pcm_8000"
20
24
PCM_16000="pcm_16000"
21
25
PCM_22050="pcm_22050"
22
26
PCM_24000="pcm_24000"
23
27
PCM_44100="pcm_44100"
28
+
PCM_48000="pcm_48000"
29
+
ULAW_8000="ulaw_8000"
24
30
25
31
26
32
class CommitStrategy(str, Enum):
@@ -50,9 +56,9 @@ class RealtimeAudioOptions(typing.TypedDict, total=False):
50
56
language_code: An ISO-639-1 or ISO-639-3 language_code corresponding to the language of the audio file. Can sometimes improve transcription performance if known beforehand.
51
57
include_timestamps: Whether to receive the committed_transcript_with_timestamps event after committing the segment (optional, defaults to False)
52
58
"""
53
-
model_id: str
54
-
audio_format: AudioFormat
55
-
sample_rate: int
59
+
model_id: Required[str]
60
+
audio_format: Required[AudioFormat]
61
+
sample_rate: Required[int]
56
62
commit_strategy: CommitStrategy
57
63
vad_silence_threshold_secs: float
58
64
vad_threshold: float
@@ -77,8 +83,8 @@ class RealtimeUrlOptions(typing.TypedDict, total=False):
77
83
language_code: An ISO-639-1 or ISO-639-3 language_code corresponding to the language of the audio file. Can sometimes improve transcription performance if known beforehand.
78
84
include_timestamps: Whether to receive the committed_transcript_with_timestamps event after committing the segment (optional, defaults to False)
0 commit comments