Fedir Zadniprovskyi committed on
Commit
47627a9
·
1 Parent(s): af41874

chore: misc

Browse files
.github/workflows/docker-build-and-push.yaml CHANGED
@@ -16,9 +16,9 @@ jobs:
16
  dockerfile: [Dockerfile.cuda, Dockerfile.cpu]
17
  include:
18
  - dockerfile: Dockerfile.cuda
19
- tag-prefix: cuda-
20
  - dockerfile: Dockerfile.cpu
21
- tag-prefix: cpu-
22
  steps:
23
  - uses: actions/checkout@v4
24
  - name: Login to Docker Hub
@@ -33,7 +33,8 @@ jobs:
33
  fedirz/faster-whisper-server
34
  # https://github.com/docker/metadata-action?tab=readme-ov-file#flavor-input
35
  flavor: |
36
- prefix=${{ matrix.tag-prefix }}
 
37
  tags: |
38
  type=semver,pattern={{version}}
39
  type=semver,pattern={{major}}.{{minor}}
 
16
  dockerfile: [Dockerfile.cuda, Dockerfile.cpu]
17
  include:
18
  - dockerfile: Dockerfile.cuda
19
+ tag-suffix: -cuda
20
  - dockerfile: Dockerfile.cpu
21
+ tag-suffix: -cpu
22
  steps:
23
  - uses: actions/checkout@v4
24
  - name: Login to Docker Hub
 
33
  fedirz/faster-whisper-server
34
  # https://github.com/docker/metadata-action?tab=readme-ov-file#flavor-input
35
  flavor: |
36
+ latest=false
37
+ suffix=${{ matrix.tag-suffix}}
38
  tags: |
39
  type=semver,pattern={{version}}
40
  type=semver,pattern={{major}}.{{minor}}
Dockerfile.cpu CHANGED
@@ -15,7 +15,7 @@ RUN poetry install --only main
15
  COPY ./faster_whisper_server ./faster_whisper_server
16
  ENTRYPOINT ["poetry", "run"]
17
  CMD ["uvicorn", "faster_whisper_server.main:app"]
18
- ENV WHISPER_MODEL=distil-medium.en
19
  ENV WHISPER_INFERENCE_DEVICE=cpu
20
  ENV WHISPER_COMPUTE_TYPE=int8
21
  ENV UVICORN_HOST=0.0.0.0
 
15
  COPY ./faster_whisper_server ./faster_whisper_server
16
  ENTRYPOINT ["poetry", "run"]
17
  CMD ["uvicorn", "faster_whisper_server.main:app"]
18
+ ENV WHISPER_MODEL=medium.en
19
  ENV WHISPER_INFERENCE_DEVICE=cpu
20
  ENV WHISPER_COMPUTE_TYPE=int8
21
  ENV UVICORN_HOST=0.0.0.0
README.md CHANGED
@@ -60,10 +60,10 @@ print(transcript.text)
60
  # If `model` isn't specified, the default model is used
61
  curl http://localhost:8000/v1/audio/transcriptions -F "[email protected]"
62
  curl http://localhost:8000/v1/audio/transcriptions -F "[email protected]"
63
- curl http://localhost:8000/v1/audio/transcriptions -F "[email protected]" -F "streaming=true"
64
- curl http://localhost:8000/v1/audio/transcriptions -F "[email protected]" -F "streaming=true" -F "model=distil-large-v3"
65
  # It's recommended that you always specify the language as that will reduce the transcription time
66
- curl http://localhost:8000/v1/audio/transcriptions -F "[email protected]" -F "streaming=true" -F "model=distil-large-v3" -F "language=en"
67
 
68
  curl http://localhost:8000/v1/audio/translations -F "[email protected]"
69
  ```
 
60
  # If `model` isn't specified, the default model is used
61
  curl http://localhost:8000/v1/audio/transcriptions -F "[email protected]"
62
  curl http://localhost:8000/v1/audio/transcriptions -F "[email protected]"
63
+ curl http://localhost:8000/v1/audio/transcriptions -F "[email protected]" -F "stream=true"
64
+ curl http://localhost:8000/v1/audio/transcriptions -F "[email protected]" -F "stream=true" -F "model=distil-large-v3"
65
  # It's recommended that you always specify the language as that will reduce the transcription time
66
+ curl http://localhost:8000/v1/audio/transcriptions -F "[email protected]" -F "stream=true" -F "model=distil-large-v3" -F "language=en"
67
 
68
  curl http://localhost:8000/v1/audio/translations -F "[email protected]"
69
  ```
faster_whisper_server/config.py CHANGED
@@ -163,7 +163,7 @@ class Language(enum.StrEnum):
163
 
164
 
165
  class WhisperConfig(BaseModel):
166
- model: Model = Field(default=Model.DISTIL_MEDIUM_EN)
167
  inference_device: Device = Field(default=Device.AUTO)
168
  compute_type: Quantization = Field(default=Quantization.DEFAULT)
169
 
 
163
 
164
 
165
  class WhisperConfig(BaseModel):
166
+ model: Model = Field(default=Model.MEDIUM_EN)
167
  inference_device: Device = Field(default=Device.AUTO)
168
  compute_type: Quantization = Field(default=Quantization.DEFAULT)
169
 
faster_whisper_server/main.py CHANGED
@@ -58,7 +58,7 @@ def load_model(model_name: Model) -> WhisperModel:
58
  compute_type=config.whisper.compute_type,
59
  )
60
  logger.info(
61
- f"Loaded {model_name} loaded in {time.perf_counter() - start:.2f} seconds"
62
  )
63
  models[model_name] = whisper
64
  return whisper
 
58
  compute_type=config.whisper.compute_type,
59
  )
60
  logger.info(
61
+ f"Loaded {model_name} loaded in {time.perf_counter() - start:.2f} seconds. {config.whisper.inference_device}({config.whisper.compute_type}) will be used for inference."
62
  )
63
  models[model_name] = whisper
64
  return whisper