made cli work with new interface

2024-01-25 16:08:53 +01:00
parent c65dc51541
commit ef7bd6e15c
3 changed files with 100 additions and 49 deletions
@@ -0,0 +1,28 @@
+"""
+This script is used to start the Gradio interface for audio transcription.
+A configuration file can be passed to the script to configure the interface.
+If no configuration file is passed, the default configuration is used.
+The main reason for this script is to allow the use of multiprocessing in the app.
+"""
+
+import multiprocessing
+from scraibe.misc import ParseKwargs
+from argparse import ArgumentParser
+
+# Command-line interface of the starter script. Building the parser has no
+# side effects, so it stays at module level; parsing happens only under the
+# ``__main__`` guard below.
+parser = ArgumentParser()
+
+parser.add_argument("--server-config", type=str, default=None,
+                    help="Path to the configy.yml file.")
+
+parser.add_argument('--server-kwargs', nargs='*', action=ParseKwargs, default={},
+                    help='Keyword arguments for the Gradio app.')
+
+if __name__ == '__main__':
+    # Parse arguments only when run as a script. With the 'spawn' start
+    # method every worker process re-imports this module, and a module-level
+    # parse_args() would re-parse sys.argv (and possibly exit) on each import.
+    args = parser.parse_args()
+
+    # Must be called once, before any process is created.
+    multiprocessing.set_start_method('spawn')
+
+    # Imported after the start method is set; presumably so that anything the
+    # app sets up at import time already uses 'spawn' -- TODO confirm.
+    from scraibe.app.app import app
+
+    app(config=args.server_config, **args.server_kwargs)
@@ -5,10 +5,11 @@ The function includes arguments for specifying the audio files, model paths,
 output formats, and other options necessary for transcription.
 """
 import os 
-from argparse import ArgumentParser, ArgumentDefaultsHelpFormatter
+from argparse import ArgumentParser, ArgumentDefaultsHelpFormatter, Action
 import json

 from .autotranscript import Scraibe
+from .misc import ParseKwargs
 from .app.app import gradio_Interface

 from whisper.tokenizer import LANGUAGES , TO_LANGUAGE_CODE
@@ -41,13 +42,15 @@ def cli():
                        help="List of audio files to transcribe.")
    
    group.add_argument('--start-server', action='store_true',
-                        help='Start the Gradio app.')
+                        help='Start the Gradio app.' \
+                        'If set, all other arguments are ignored' \
+                        'besides --server-config or --server-kwargs.')
    
-    parser.add_argument("--port", type=int, default= None,
-                        help="Port to run the Gradio app on. Defaults to 7860.")
+    parser.add_argument("--server-config", type=str, default= None,
+                        help="Path to the configy.yml file.")
    
-    parser.add_argument("--server-name", type=str, default= None,
-                        help="Name of the Gradio app. If empty 127.0.0.1 or 0.0.0.0 will be used.")
+    parser.add_argument('--server-kwargs', nargs='*', action=ParseKwargs, default={},
+                        help='Keyword arguments for the Gradio app.')
                        
    parser.add_argument("--whisper-model-name", default="medium",
                        help="Name of the Whisper model to use.")
@@ -66,7 +69,8 @@ def cli():
                        help="Device to use for PyTorch inference.")

    parser.add_argument("--num-threads", type=int, default=0,
-                        help="Number of threads used by torch for CPU inference; overrides MKL_NUM_THREADS/OMP_NUM_THREADS.")
+                        help="Number of threads used by torch for CPU inference; '\
+                            'overrides MKL_NUM_THREADS/OMP_NUM_THREADS.")

    parser.add_argument("--output-directory", "-o", type=str, default=".",
                        help="Directory to save the transcription outputs.")
@@ -113,8 +117,9 @@ def cli():
    if arg_dict["whisper_model_directory"]:
        class_kwargs["download_root"] = arg_dict.pop("whisper_model_directory")

-    model = Scraibe(**class_kwargs)
+    if not start_server:
        
+        model = Scraibe(**class_kwargs)

        if arg_dict["audio_files"]:
            audio_files = arg_dict.pop("audio_files")
@@ -158,10 +163,13 @@ def cli():
                        f.write(out)  
                    
    
-    if start_server: # unfinished code
+    else: # unfinished code
+        import subprocess
+        import sys
        
-        gradio_Interface(model).queue().launch(server_port=args.port, server_name=args.server_name)
+        execute_path = os.path.join(os.path.dirname(__file__), "app/app_starter.py")
        
+        subprocess.run([sys.executable, execute_path])

 if __name__ == "__main__":
    cli()
@@ -1,6 +1,7 @@
 import os
 import yaml
 from pyannote.audio.core.model import CACHE_DIR as PYANNOTE_CACHE_DIR
+from argparse import Action

 CACHE_DIR = os.getenv(
    "AUTOT_CACHE",
@@ -38,3 +39,17 @@ def config_diarization_yaml(file_path: str, path_to_segmentation: str = None) ->

    with open(file_path, "w") as stream:
        yaml.dump(yml, stream)
+
+class ParseKwargs(Action):
+    """
+    Custom argparse action to parse keyword arguments.
+
+    Every token given to the option must have the form ``KEY=VALUE``. The
+    tokens are collected into a fresh dict that is stored on the namespace
+    under ``self.dest``. Only the first ``=`` separates key from value, so
+    values may themselves contain ``=``.
+
+    Values that are valid Python literals (numbers, ``True``/``False``/``None``,
+    quoted strings, tuples, lists, dicts, sets) are converted to the
+    corresponding object; everything else is kept as the raw string.
+
+    Raises:
+        argparse.ArgumentError: If a token has no ``=`` or an empty key.
+            Inside ``parse_args`` argparse reports this as a usage error.
+    """
+    def __call__(self, parser, namespace, values, option_string=None):
+        # Local imports keep this class self-contained without touching the
+        # module's import block.
+        import ast
+        from argparse import ArgumentError
+
+        # Without nargs argparse hands over a single string, not a list.
+        if isinstance(values, str):
+            values = [values]
+
+        parsed = {}
+        for item in values or ():
+            # partition() splits on the first '=' only, so 'a=b=c' -> ('a', 'b=c').
+            key, sep, raw = item.partition('=')
+            if not sep or not key:
+                raise ArgumentError(self, f"expected KEY=VALUE, got {item!r}")
+            try:
+                # NOTE: literal_eval replaces eval() on purpose. eval() would
+                # execute arbitrary expressions from the command line and
+                # turn bare words such as 'max' into builtins.
+                parsed[key] = ast.literal_eval(raw)
+            except (ValueError, SyntaxError, TypeError, MemoryError, RecursionError):
+                # Not a Python literal (e.g. 'localhost', '0.0.0.0'): keep the text.
+                parsed[key] = raw
+
+        setattr(namespace, self.dest, parsed)