# Source: faster-whisper-server Gradio demo
# Author: Fedir Zadniprovskyi — commit 42343e0 ("chore: fix some ruff errors")
from collections.abc import Generator
from pathlib import Path
import gradio as gr
import httpx
from httpx_sse import connect_sse
from openai import OpenAI
from faster_whisper_server.config import Config, Task
# REST endpoints exposed by the faster-whisper server (OpenAI-compatible API).
TRANSCRIPTION_ENDPOINT = "/v1/audio/transcriptions"
TRANSLATION_ENDPOINT = "/v1/audio/translations"
# Generous request timeout: transcribing/translating long audio can take minutes.
TIMEOUT_SECONDS = 180
TIMEOUT = httpx.Timeout(timeout=TIMEOUT_SECONDS)
def create_gradio_demo(config: Config) -> gr.Blocks:
    """Build the Gradio playground UI for the transcription/translation server.

    Creates an HTTP client pointed at the locally running server (derived from
    ``config.host``/``config.port``) and wires up a Gradio interface with audio
    input, model/task selection, temperature, and an optional streaming mode.

    Args:
        config: Server configuration; provides host, port, and the default
            whisper model name.

    Returns:
        A ``gr.Blocks`` demo ready to be launched.
    """
    base_url = f"http://{config.host}:{config.port}"
    http_client = httpx.Client(base_url=base_url, timeout=TIMEOUT)
    # The OpenAI client is only used to list available models; the server does
    # not check the API key, but the client library requires a non-empty one.
    openai_client = OpenAI(base_url=f"{base_url}/v1", api_key="cant-be-empty")

    def handler(file_path: str, model: str, task: Task, temperature: float, stream: bool) -> Generator[str, None, None]:
        """Dispatch the request to the matching endpoint, streaming if asked.

        Yields the (cumulative) transcription text one or more times.
        """
        if task == Task.TRANSCRIBE:
            endpoint = TRANSCRIPTION_ENDPOINT
        elif task == Task.TRANSLATE:
            endpoint = TRANSLATION_ENDPOINT
        else:
            # Previously an unknown task fell through with `endpoint` unbound,
            # raising a confusing NameError below. Fail explicitly instead.
            raise ValueError(f"Unsupported task: {task}")

        if stream:
            previous_transcription = ""
            for transcription in streaming_audio_task(file_path, endpoint, temperature, model):
                previous_transcription += transcription
                yield previous_transcription
        else:
            yield audio_task(file_path, endpoint, temperature, model)

    def audio_task(file_path: str, endpoint: str, temperature: float, model: str) -> str:
        """Send the audio file in one request and return the full text result."""
        with Path(file_path).open("rb") as file:
            response = http_client.post(
                endpoint,
                files={"file": file},
                data={
                    "model": model,
                    "response_format": "text",
                    "temperature": temperature,
                },
            )

        response.raise_for_status()
        return response.text

    def streaming_audio_task(
        file_path: str, endpoint: str, temperature: float, model: str
    ) -> Generator[str, None, None]:
        """Send the audio file and yield transcription chunks as SSE events arrive."""
        with Path(file_path).open("rb") as file:
            kwargs = {
                "files": {"file": file},
                "data": {
                    "response_format": "text",
                    "temperature": temperature,
                    "model": model,
                    "stream": True,
                },
            }
            with connect_sse(http_client, "POST", endpoint, **kwargs) as event_source:
                for event in event_source.iter_sse():
                    yield event.data

    def update_model_dropdown() -> gr.Dropdown:
        """Refresh the model dropdown from the server, recommended models first."""
        models = openai_client.models.list().data
        model_names: list[str] = [model.id for model in models]
        assert config.whisper.model in model_names
        # Use order-preserving list comprehensions rather than a set so the
        # dropdown ordering is deterministic across page loads.
        recommended_models = [model for model in model_names if model.startswith("Systran")]
        other_models = [model for model in model_names if not model.startswith("Systran")]
        model_names = recommended_models + other_models
        return gr.Dropdown(
            # no idea why it's complaining
            choices=model_names,  # pyright: ignore[reportArgumentType]
            label="Model",
            value=config.whisper.model,
        )

    model_dropdown = gr.Dropdown(
        choices=[config.whisper.model],
        label="Model",
        value=config.whisper.model,
    )
    task_dropdown = gr.Dropdown(
        choices=[task.value for task in Task],
        label="Task",
        value=Task.TRANSCRIBE,
    )
    temperature_slider = gr.Slider(minimum=0.0, maximum=1.0, step=0.1, label="Temperature", value=0.0)
    stream_checkbox = gr.Checkbox(label="Stream", value=True)
    with gr.Interface(
        title="Whisper Playground",
        description="""Consider supporting the project by starring the <a href="https://github.com/fedirz/faster-whisper-server">repository on GitHub</a>.""",  # noqa: E501
        inputs=[
            gr.Audio(type="filepath"),
            model_dropdown,
            task_dropdown,
            temperature_slider,
            stream_checkbox,
        ],
        fn=handler,
        outputs="text",
        analytics_enabled=False,  # disable telemetry
    ) as demo:
        # Populate the real model list from the server once the UI loads.
        demo.load(update_model_dropdown, inputs=None, outputs=model_dropdown)
    return demo