Spaces:

fedirz
/

faster-whisper-server

Configuration error

Fedir Zadniprovskyi committed on May 25, 2024

Commit

db500b1

1 Parent(s): 3431d63

chore: allow configuring the default language and response format

Files changed (2) hide show

speaches/config.py CHANGED Viewed

@@ -3,6 +3,8 @@ import enum
 from pydantic import BaseModel, Field
 from pydantic_settings import BaseSettings, SettingsConfigDict
 SAMPLES_PER_SECOND = 16000
 BYTES_PER_SAMPLE = 2
 BYTES_PER_SECOND = SAMPLES_PER_SECOND * BYTES_PER_SAMPLE
@@ -167,6 +169,10 @@ class Config(BaseSettings):
     model_config = SettingsConfigDict(env_nested_delimiter="_")
     log_level: str = "info"  # ENV: LOG_LEVEL
     whisper: WhisperConfig = WhisperConfig()  # ENV: WHISPER_*
     """
     Max duration to wait for the next audio chunk before transcription is finalized and connection is closed.

 from pydantic import BaseModel, Field
 from pydantic_settings import BaseSettings, SettingsConfigDict
+from speaches.server_models import ResponseFormat
 SAMPLES_PER_SECOND = 16000
 BYTES_PER_SAMPLE = 2
 BYTES_PER_SECOND = SAMPLES_PER_SECOND * BYTES_PER_SAMPLE
     model_config = SettingsConfigDict(env_nested_delimiter="_")
     log_level: str = "info"  # ENV: LOG_LEVEL
+    default_language: Language | None = None  # ENV: DEFAULT_LANGUAGE
+    default_response_format: ResponseFormat = (
+        ResponseFormat.JSON
+    )  # ENV: DEFAULT_RESPONSE_FORMAT
     whisper: WhisperConfig = WhisperConfig()  # ENV: WHISPER_*
     """
     Max duration to wait for the next audio chunk before transcription is finalized and connection is closed.

speaches/main.py CHANGED Viewed

@@ -55,7 +55,7 @@ async def translate_file(
     file: Annotated[UploadFile, Form()],
     model: Annotated[Model, Form()] = config.whisper.model,
     prompt: Annotated[str | None, Form()] = None,
-    response_format: Annotated[ResponseFormat, Form()] = ResponseFormat.JSON,
     temperature: Annotated[float, Form()] = 0.0,
     stream: Annotated[bool, Form()] = False,
 ):
@@ -108,9 +108,9 @@ async def translate_file(
 async def transcribe_file(
     file: Annotated[UploadFile, Form()],
     model: Annotated[Model, Form()] = config.whisper.model,
-    language: Annotated[Language | None, Form()] = None,
     prompt: Annotated[str | None, Form()] = None,
-    response_format: Annotated[ResponseFormat, Form()] = ResponseFormat.JSON,
     temperature: Annotated[float, Form()] = 0.0,
     timestamp_granularities: Annotated[
         list[Literal["segments"] | Literal["words"]],
@@ -223,9 +223,9 @@ def format_transcription(
 async def transcribe_stream(
     ws: WebSocket,
     model: Annotated[Model, Query()] = config.whisper.model,
-    language: Annotated[Language | None, Query()] = None,
     prompt: Annotated[str | None, Query()] = None,
-    response_format: Annotated[ResponseFormat, Query()] = ResponseFormat.JSON,
     temperature: Annotated[float, Query()] = 0.0,
     timestamp_granularities: Annotated[
         list[Literal["segments"] | Literal["words"]],

     file: Annotated[UploadFile, Form()],
     model: Annotated[Model, Form()] = config.whisper.model,
     prompt: Annotated[str | None, Form()] = None,
+    response_format: Annotated[ResponseFormat, Form()] = config.default_response_format,
     temperature: Annotated[float, Form()] = 0.0,
     stream: Annotated[bool, Form()] = False,
 ):
 async def transcribe_file(
     file: Annotated[UploadFile, Form()],
     model: Annotated[Model, Form()] = config.whisper.model,
+    language: Annotated[Language | None, Form()] = config.default_language,
     prompt: Annotated[str | None, Form()] = None,
+    response_format: Annotated[ResponseFormat, Form()] = config.default_response_format,
     temperature: Annotated[float, Form()] = 0.0,
     timestamp_granularities: Annotated[
         list[Literal["segments"] | Literal["words"]],
 async def transcribe_stream(
     ws: WebSocket,
     model: Annotated[Model, Query()] = config.whisper.model,
+    language: Annotated[Language | None, Query()] = config.default_language,
     prompt: Annotated[str | None, Query()] = None,
+    response_format: Annotated[ResponseFormat, Query()] = config.default_response_format,
     temperature: Annotated[float, Query()] = 0.0,
     timestamp_granularities: Annotated[
         list[Literal["segments"] | Literal["words"]],