Spaces:
Configuration error
Configuration error
from collections.abc import Generator | |
from pathlib import Path | |
import gradio as gr | |
import httpx | |
from httpx_sse import connect_sse | |
from openai import OpenAI | |
from faster_whisper_server.config import Config, Task | |
# Paths (relative to the server's base URL) of the two audio endpoints the
# playground posts uploaded files to.
TRANSCRIPTION_ENDPOINT = "/v1/audio/transcriptions"
TRANSLATION_ENDPOINT = "/v1/audio/translations"

# A single timeout value, in seconds, handed to httpx for every request made
# through the shared client.
TIMEOUT_SECONDS = 180
TIMEOUT = httpx.Timeout(TIMEOUT_SECONDS)
def create_gradio_demo(config: Config) -> gr.Blocks:
    """Build the "Whisper Playground" Gradio interface.

    The UI talks to the HTTP API at ``http://{config.host}:{config.port}``:
    uploaded audio is posted to the transcription or translation endpoint,
    and the model dropdown is refreshed from the ``/v1`` models listing each
    time the page loads.

    Args:
        config: Application configuration; ``host``, ``port`` and
            ``whisper.model`` are read here.

    Returns:
        The constructed ``gr.Interface`` (not launched).
    """
    base_url = f"http://{config.host}:{config.port}"
    http_client = httpx.Client(base_url=base_url, timeout=TIMEOUT)
    # The API key is only a placeholder; per the literal itself, the client
    # does not accept an empty value.
    openai_client = OpenAI(base_url=f"{base_url}/v1", api_key="cant-be-empty")

    def handler(
        file_path: str, model: str, task: Task, temperature: float, stream: bool
    ) -> Generator[str, None, None]:
        """Run the selected task on the uploaded file and yield text for the UI.

        When ``stream`` is true, each yielded value is the full text
        accumulated so far; otherwise a single final result is yielded.

        Raises:
            ValueError: If ``task`` is neither ``Task.TRANSCRIBE`` nor
                ``Task.TRANSLATE``.
        """
        if task == Task.TRANSCRIBE:
            endpoint = TRANSCRIPTION_ENDPOINT
        elif task == Task.TRANSLATE:
            endpoint = TRANSLATION_ENDPOINT
        else:
            # Fail with a clear message instead of an UnboundLocalError on
            # `endpoint` further down.
            raise ValueError(f"Unsupported task: {task!r}")

        if stream:
            previous_transcription = ""
            for transcription in streaming_audio_task(file_path, endpoint, temperature, model):
                # Yield the running total so the output box shows everything
                # received so far rather than only the latest piece.
                previous_transcription += transcription
                yield previous_transcription
        else:
            yield audio_task(file_path, endpoint, temperature, model)

    def audio_task(file_path: str, endpoint: str, temperature: float, model: str) -> str:
        """POST the file to ``endpoint`` and return the response body as text.

        Raises:
            httpx.HTTPStatusError: If the server answers with an error status.
        """
        with Path(file_path).open("rb") as file:
            response = http_client.post(
                endpoint,
                files={"file": file},
                data={
                    "model": model,
                    "response_format": "text",
                    "temperature": temperature,
                },
            )

        response.raise_for_status()
        return response.text

    def streaming_audio_task(
        file_path: str, endpoint: str, temperature: float, model: str
    ) -> Generator[str, None, None]:
        """POST the file with ``stream`` enabled and yield each SSE event's data.

        Raises:
            httpx.HTTPStatusError: If the server answers with an error status.
        """
        with Path(file_path).open("rb") as file:
            kwargs = {
                "files": {"file": file},
                "data": {
                    "response_format": "text",
                    "temperature": temperature,
                    "model": model,
                    "stream": True,
                },
            }
            with connect_sse(http_client, "POST", endpoint, **kwargs) as event_source:
                # Mirror audio_task: surface HTTP errors explicitly before
                # trying to parse the body as an event stream.
                event_source.response.raise_for_status()
                for event in event_source.iter_sse():
                    yield event.data

    def update_model_dropdown() -> gr.Dropdown:
        """Return a model dropdown populated from the server's model listing.

        Model ids starting with "Systran" are listed first; within each group
        the order returned by the server is kept.

        Raises:
            ValueError: If the configured model is missing from the listing.
        """
        models = openai_client.models.list().data
        model_names: list[str] = [model.id for model in models]
        # Explicit check rather than `assert`, which is stripped under -O.
        if config.whisper.model not in model_names:
            raise ValueError(
                f"Configured model {config.whisper.model!r} is not among the models reported by the server"
            )
        # Lists (not a set) keep the dropdown order stable from run to run.
        recommended_models = [name for name in model_names if name.startswith("Systran")]
        other_models = [name for name in model_names if not name.startswith("Systran")]
        model_names = recommended_models + other_models
        return gr.Dropdown(
            # no idea why it's complaining
            choices=model_names,  # pyright: ignore[reportArgumentType]
            label="Model",
            value=config.whisper.model,
        )

    # Starts with only the configured model; the full list is filled in by
    # update_model_dropdown when the page loads.
    model_dropdown = gr.Dropdown(
        choices=[config.whisper.model],
        label="Model",
        value=config.whisper.model,
    )
    task_dropdown = gr.Dropdown(
        choices=[task.value for task in Task],
        label="Task",
        value=Task.TRANSCRIBE,
    )
    temperature_slider = gr.Slider(minimum=0.0, maximum=1.0, step=0.1, label="Temperature", value=0.0)
    stream_checkbox = gr.Checkbox(label="Stream", value=True)
    with gr.Interface(
        title="Whisper Playground",
        description="""Consider supporting the project by starring the <a href="https://github.com/fedirz/faster-whisper-server">repository on GitHub</a>.""",  # noqa: E501
        inputs=[
            gr.Audio(type="filepath"),
            model_dropdown,
            task_dropdown,
            temperature_slider,
            stream_checkbox,
        ],
        fn=handler,
        outputs="text",
        analytics_enabled=False,  # disable telemetry
    ) as demo:
        demo.load(update_model_dropdown, inputs=None, outputs=model_dropdown)
    return demo