Merge pull request #290 from jhj0517/fix/defaults
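This merge adds sensible defaults to the Gradio-facing signatures: every progress: gr.Progress parameter gains a gr.Progress() default, transcribe_file, transcribe_mic, and transcribe_youtube default file_format to "SRT" and add_timestamp to True, and the output-format comparison is normalized with strip().lower() so the check is case-insensitive.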
modules/translation/nllb_inference.py
CHANGED
@@ -35,7 +35,7 @@ class NLLBInference(TranslationBase):
                      model_size: str,
                      src_lang: str,
                      tgt_lang: str,
-                     progress: gr.Progress
+                     progress: gr.Progress = gr.Progress()
                      ):
         if model_size != self.current_model_size or self.model is None:
             print("\nInitializing NLLB Model..\n")
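With the default in place, update_model can be called outside of a Gradio event (for example from a script or a test) without passing a progress tracker. A minimal sketch of such a direct call; the constructor call and model id below are assumptions for illustration, not taken from this PR:

from modules.translation.nllb_inference import NLLBInference

translator = NLLBInference()  # hypothetical constructor call; see the repo for actual arguments
translator.update_model(
    model_size="facebook/nllb-200-distilled-600M",  # hypothetical model id
    src_lang="English",
    tgt_lang="Korean",
)  # progress now defaults to gr.Progress(), so no Gradio event context is required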
modules/translation/translation_base.py
CHANGED
@@ -37,7 +37,7 @@ class TranslationBase(ABC):
                      model_size: str,
                      src_lang: str,
                      tgt_lang: str,
-                     progress: gr.Progress
+                     progress: gr.Progress = gr.Progress()
                      ):
         pass
 
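Mirroring the default on the abstract method keeps the base-class contract in sync with the subclasses. One standard-Python caveat worth knowing: a default like gr.Progress() is evaluated once, when the function is defined, so every call that omits the argument shares the same instance. This matches Gradio's documented progress pattern, where the library detects a gr.Progress default in the signature and drives a tracked instance during events. A self-contained sketch of the evaluated-once behavior, using a plain list instead of gr.Progress:

def append_item(x, box=[]):  # the default object is created once, at definition time
    box.append(x)
    return box

print(append_item(1))  # [1]
print(append_item(2))  # [1, 2] -- the same list object is reused across calls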
modules/whisper/faster_whisper_inference.py
CHANGED
@@ -40,7 +40,7 @@ class FasterWhisperInference(WhisperBase):
 
     def transcribe(self,
                    audio: Union[str, BinaryIO, np.ndarray],
-                   progress: gr.Progress,
+                   progress: gr.Progress = gr.Progress(),
                    *whisper_params,
                    ) -> Tuple[List[dict], float]:
         """
@@ -126,7 +126,7 @@ class FasterWhisperInference(WhisperBase):
     def update_model(self,
                      model_size: str,
                      compute_type: str,
-                     progress: gr.Progress
+                     progress: gr.Progress = gr.Progress()
                      ):
         """
         Update current model setting
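Because *whisper_params follows the progress parameter, the default only helps callers who stop at audio: any extra positional argument still binds to progress first. A quick sketch of that binding rule with generic stand-ins (not the repo's API):

def transcribe(audio, progress="default", *params):
    return progress, params

print(transcribe("a.wav"))            # ('default', ())
print(transcribe("a.wav", 0.5, 0.9))  # (0.5, (0.9,)) -- 0.5 lands in progress, not params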
modules/whisper/insanely_fast_whisper_inference.py
CHANGED
@@ -39,7 +39,7 @@ class InsanelyFastWhisperInference(WhisperBase):
 
     def transcribe(self,
                    audio: Union[str, np.ndarray, torch.Tensor],
-                   progress: gr.Progress,
+                   progress: gr.Progress = gr.Progress(),
                    *whisper_params,
                    ) -> Tuple[List[dict], float]:
         """
@@ -98,7 +98,7 @@ class InsanelyFastWhisperInference(WhisperBase):
     def update_model(self,
                      model_size: str,
                      compute_type: str,
-                     progress: gr.Progress,
+                     progress: gr.Progress = gr.Progress(),
                      ):
         """
         Update current model setting
modules/whisper/whisper_Inference.py
CHANGED
@@ -28,7 +28,7 @@ class WhisperInference(WhisperBase):
 
     def transcribe(self,
                    audio: Union[str, np.ndarray, torch.Tensor],
-                   progress: gr.Progress,
+                   progress: gr.Progress = gr.Progress(),
                    *whisper_params,
                    ) -> Tuple[List[dict], float]:
         """
@@ -79,7 +79,7 @@ class WhisperInference(WhisperBase):
     def update_model(self,
                      model_size: str,
                      compute_type: str,
-                     progress: gr.Progress,
+                     progress: gr.Progress = gr.Progress(),
                      ):
         """
         Update current model setting
modules/whisper/whisper_base.py
CHANGED
@@ -53,7 +53,7 @@ class WhisperBase(ABC):
     @abstractmethod
     def transcribe(self,
                    audio: Union[str, BinaryIO, np.ndarray],
-                   progress: gr.Progress,
+                   progress: gr.Progress = gr.Progress(),
                    *whisper_params,
                    ):
         """Inference whisper model to transcribe"""
@@ -63,7 +63,7 @@ class WhisperBase(ABC):
     def update_model(self,
                      model_size: str,
                      compute_type: str,
-                     progress: gr.Progress
+                     progress: gr.Progress = gr.Progress()
                      ):
         """Initialize whisper model"""
         pass
@@ -171,10 +171,10 @@ class WhisperBase(ABC):
         return result, elapsed_time
 
     def transcribe_file(self,
-                        files:
-                        input_folder_path: str,
-                        file_format: str,
-                        add_timestamp: bool,
+                        files: Optional[List] = None,
+                        input_folder_path: Optional[str] = None,
+                        file_format: str = "SRT",
+                        add_timestamp: bool = True,
                         progress=gr.Progress(),
                         *whisper_params,
                         ) -> list:
@@ -250,8 +250,8 @@ class WhisperBase(ABC):
 
     def transcribe_mic(self,
                        mic_audio: str,
-                       file_format: str,
-                       add_timestamp: bool,
+                       file_format: str = "SRT",
+                       add_timestamp: bool = True,
                        progress=gr.Progress(),
                        *whisper_params,
                        ) -> list:
@@ -306,8 +306,8 @@ class WhisperBase(ABC):
 
     def transcribe_youtube(self,
                            youtube_link: str,
-                           file_format: str,
-                           add_timestamp: bool,
+                           file_format: str = "SRT",
+                           add_timestamp: bool = True,
                            progress=gr.Progress(),
                            *whisper_params,
                            ) -> list:
@@ -411,11 +411,12 @@ class WhisperBase(ABC):
         else:
             output_path = os.path.join(output_dir, f"{file_name}")
 
-        if file_format == "SRT":
+        file_format = file_format.strip().lower()
+        if file_format == "srt":
             content = get_srt(transcribed_segments)
             output_path += '.srt'
 
-        elif file_format == "WebVTT":
+        elif file_format == "webvtt":
             content = get_vtt(transcribed_segments)
             output_path += '.vtt'
 
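The last hunk also makes the output-format check tolerant of casing and stray whitespace, so "SRT", "srt", and " WebVTT " all resolve to the right extension. The branching logic in isolation (pick_extension is a stand-in name, not a function from the repo):

def pick_extension(file_format: str) -> str:
    file_format = file_format.strip().lower()  # normalize before comparing
    if file_format == "srt":
        return ".srt"
    elif file_format == "webvtt":
        return ".vtt"
    raise ValueError(f"unsupported file format: {file_format}")

print(pick_extension(" SRT "))   # .srt
print(pick_extension("WebVTT"))  # .vtt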