Skip to content

Commit

Permalink
chore: adjust live transcription defaults and add descriptions
Browse files Browse the repository at this point in the history
  • Loading branch information
Fedir Zadniprovskyi authored and fedirz committed Aug 27, 2024
1 parent f46133f commit 000ea9d
Showing 1 changed file with 13 additions and 3 deletions.
16 changes: 13 additions & 3 deletions faster_whisper_server/config.py
Original file line number Diff line number Diff line change
Expand Up @@ -184,20 +184,30 @@ class Config(BaseSettings):
"""

default_language: Language | None = None
"""
Default language to use for transcription. If not set, the language will be detected automatically.
It is recommended to set this as it will improve the performance.
"""
default_response_format: ResponseFormat = ResponseFormat.JSON
whisper: WhisperConfig = WhisperConfig()
max_models: int = 1
"""
Maximum number of models that can be loaded at a time.
"""
max_no_data_seconds: float = 1.0
"""
Max duration to for the next audio chunk before transcription is finilized and connection is closed.
Max duration to wait for the next audio chunk before transcription is finalized and connection is closed.
"""
min_duration: float = 1.0
"""
Minimum duration of an audio chunk that will be transcribed.
"""
word_timestamp_error_margin: float = 0.2
max_inactivity_seconds: float = 5.0
max_inactivity_seconds: float = 2.5
"""
Max allowed audio duration without any speech being detected before transcription is finalized and connection is closed.
""" # noqa: E501
inactivity_window_seconds: float = 10.0
inactivity_window_seconds: float = 5.0
"""
Controls how many latest seconds of audio are being passed through VAD.
Should be greater than `max_inactivity_seconds`
Expand Down

0 comments on commit 000ea9d

Please sign in to comment.