Spaces:

fedirz
/

faster-whisper-server

Configuration error

App Files Community

Fedir Zadniprovskyi committed on May 23, 2024

Commit

a9ee91b

1 Parent(s): e1a6910

refactor: simplify tests

Browse files

Files changed (1) hide show

tests/app_test.py +33 -28

tests/app_test.py CHANGED Viewed

@@ -15,6 +15,9 @@ from speaches.main import app
 from speaches.server_models import TranscriptionVerboseResponse
 SIMILARITY_THRESHOLD = 0.97
 @pytest.fixture()
@@ -23,12 +26,17 @@ def client() -> Generator[TestClient, None, None]:
         yield client
 def get_audio_file_paths():
     file_paths = []
     directory = "tests/data"
-    for filename in reversed(os.listdir(directory)[5:6]):
-        if filename.endswith(".raw"):
-            file_paths.append(os.path.join(directory, filename))
     return file_paths
@@ -48,7 +56,7 @@ def transcribe_audio_data(
     client: TestClient, data: bytes
 ) -> TranscriptionVerboseResponse:
     response = client.post(
-        "/v1/audio/transcriptions?response_format=verbose_json",
         files={"file": ("audio.raw", data, "audio/raw")},
     )
     data = json.loads(response.json())  # TODO: figure this out
@@ -56,29 +64,26 @@ def transcribe_audio_data(
 @pytest.mark.parametrize("file_path", file_paths)
-def test_ws_audio_transcriptions(client: TestClient, file_path: str):
     with open(file_path, "rb") as file:
         data = file.read()
-        streaming_transcription: TranscriptionVerboseResponse = None  # type: ignore
-        with client.websocket_connect(
-            "/v1/audio/transcriptions?response_format=verbose_json"
-        ) as ws:
-            thread = threading.Thread(
-                target=stream_audio_data, args=(ws, data), kwargs={"speed": 4.0}
-            )
-            thread.start()
-            while True:
-                try:
-                    streaming_transcription = TranscriptionVerboseResponse(
-                        **ws.receive_json()
-                    )
-                except WebSocketDisconnect:
-                    break
-            ws.close()
-        file_transcription = transcribe_audio_data(client, data)
-        s = SequenceMatcher(
-            lambda x: x == " ", file_transcription.text, streaming_transcription.text
-        )
-        assert (
-            s.ratio() > SIMILARITY_THRESHOLD
-        ), f"\nExpected: {file_transcription.text}\nReceived: {streaming_transcription.text}"

 from speaches.server_models import TranscriptionVerboseResponse
 SIMILARITY_THRESHOLD = 0.97
+AUDIO_FILES_LIMIT = 5
+AUDIO_FILE_DIR = "tests/data"
+TRANSCRIBE_ENDPOINT = "/v1/audio/transcriptions?response_format=verbose_json"
 @pytest.fixture()
         yield client
+@pytest.fixture()
+def ws(client: TestClient) -> Generator[WebSocketTestSession, None, None]:
+    with client.websocket_connect(TRANSCRIBE_ENDPOINT) as ws:
+        yield ws
 def get_audio_file_paths():
     file_paths = []
     directory = "tests/data"
+    for filename in sorted(os.listdir(directory)[:AUDIO_FILES_LIMIT]):
+        file_paths.append(os.path.join(directory, filename))
     return file_paths
     client: TestClient, data: bytes
 ) -> TranscriptionVerboseResponse:
     response = client.post(
+        TRANSCRIBE_ENDPOINT,
         files={"file": ("audio.raw", data, "audio/raw")},
     )
     data = json.loads(response.json())  # TODO: figure this out
 @pytest.mark.parametrize("file_path", file_paths)
+def test_ws_audio_transcriptions(
+    client: TestClient, ws: WebSocketTestSession, file_path: str
+):
     with open(file_path, "rb") as file:
         data = file.read()
+    streaming_transcription: TranscriptionVerboseResponse = None  # type: ignore
+    thread = threading.Thread(
+        target=stream_audio_data, args=(ws, data), kwargs={"speed": 4.0}
+    )
+    thread.start()
+    while True:
+        try:
+            streaming_transcription = TranscriptionVerboseResponse(**ws.receive_json())
+        except WebSocketDisconnect:
+            break
+    file_transcription = transcribe_audio_data(client, data)
+    s = SequenceMatcher(
+        lambda x: x == " ", file_transcription.text, streaming_transcription.text
+    )
+    assert (
+        s.ratio() > SIMILARITY_THRESHOLD
+    ), f"\nExpected: {file_transcription.text}\nReceived: {streaming_transcription.text}"