rework structure of gradio app

2023-11-20 15:01:51 +01:00
parent f691790c00
commit bbb2c848e3
8 changed files with 484 additions and 507 deletions
@@ -0,0 +1,129 @@
+"""
+This file defines the gradio Blocks app through which the user interacts with ScrAIbe.
+"""
+
+import gradio as gr
+import os
+
+import scraibe.app.global_var as gv
+from .interactions import *
+from .stg import *
+
+from scraibe import Scraibe
+
+# Colour scheme shared by every component of the Blocks app.
+theme = gr.themes.Soft(primary_hue="green", secondary_hue="orange", neutral_hue="gray")
+
+
+# Choices offered by the "Language (optional)" dropdown, one row per initial letter.
+LANGUAGES = [
+    "Afrikaans", "Arabic", "Armenian", "Azerbaijani",
+    "Belarusian", "Bosnian", "Bulgarian",
+    "Catalan", "Chinese", "Croatian", "Czech",
+    "Danish", "Dutch",
+    "English", "Estonian",
+    "Finnish", "French",
+    "Galician", "German", "Greek",
+    "Hebrew", "Hindi", "Hungarian",
+    "Icelandic", "Indonesian", "Italian",
+    "Japanese",
+    "Kannada", "Kazakh", "Korean",
+    "Latvian", "Lithuanian",
+    "Macedonian", "Malay", "Marathi", "Maori",
+    "Nepali", "Norwegian",
+    "Persian", "Polish", "Portuguese",
+    "Romanian", "Russian",
+    "Serbian", "Slovak", "Slovenian", "Spanish", "Swahili", "Swedish",
+    "Tagalog", "Tamil", "Thai", "Turkish",
+    "Ukrainian", "Urdu",
+    "Vietnamese",
+    "Welsh",
+]
+
+# Directory holding this module (symlinks resolved); header.html and logo.svg
+# are looked up relative to it.
+CURRENT_PATH = os.path.split(os.path.realpath(__file__))[0]
+
+
+def gradio_Interface(pipe : Scraibe = None):
+    """
+    Build the gradio Blocks app: header, option widgets, input widgets,
+    output widgets and the event wiring between them.
+
+    Args:
+        pipe (Scraibe, optional): When given, it is wrapped in a
+            GradioTranscriptionInterface and stored in ``gv.MODEL``.
+            When None, ``gv.MODEL`` is left untouched.
+
+    Returns:
+        gr.Blocks: The assembled app. It is not launched here.
+    """
+
+    if pipe is not None:
+        gv.MODEL = GradioTranscriptionInterface(pipe)
+
+    with gr.Blocks(theme=theme,title='ScrAIbe: Automatic Audio Transcription') as demo:
+
+            # Define components
+            hname = os.path.join(CURRENT_PATH, "header.html")
+            # Use a context manager so the file handle is closed right away,
+            # and pin the encoding so the result does not depend on the locale.
+            with open(hname, "r", encoding="utf-8") as header_file:
+                header = header_file.read()
+
+            # ugly hack to get the logo to work
+            header = header.replace("/file=logo.svg", f"/file={CURRENT_PATH}/logo.svg" )
+
+            gr.HTML(header, visible= True, show_label=False)
+
+            with gr.Row():
+
+                # Left column: task options, input selection and submit button.
+                with gr.Column():
+
+                    task = gr.Radio(["Auto Transcribe", "Transcribe", "Diarisation"], label="Task",
+                                    value= 'Auto Transcribe')
+
+                    num_speakers = gr.Number(value=0, label= "Number of speakers (optional)", 
+                                    info = "Number of speakers in the audio file. If you don't know,\
+                                        leave it at 0.", visible= True)
+
+                    # NOTE(review): `choices` is not a documented gr.Checkbox
+                    # parameter - confirm the installed gradio version ignores it.
+                    translate = gr.Checkbox(label="Translation", choices=[True, False], value = False,
+                                    info="Select 'Yes' to have the output translated into English.",
+                                    visible= True)
+
+                    # NOTE(review): the default "None" is not an entry of LANGUAGES -
+                    # presumably the handlers treat it as "auto-detect"; verify.
+                    language = gr.Dropdown(LANGUAGES,
+                                    label="Language (optional)", value = "None",
+                                    info="Language of the audio file. If you don't know,\
+                                        leave it at None.", visible= True)
+
+                    # Named `input_type` rather than `input` to avoid shadowing the builtin.
+                    input_type = gr.Radio(["Upload Audio", "Record Audio", "Upload Video","Record Video" 
+                                        ,"File or Files"], label="Input Type", value="Upload Audio")
+
+                    # One widget per input type; only the audio upload starts visible.
+                    audio1 = gr.Audio(source="upload", type="filepath", label="Upload Audio",
+                                        interactive= True, visible= True)
+                    audio2 = gr.Audio(source="microphone", label="Record Audio", type="filepath",
+                                        interactive= True, visible= False)
+                    video1 = gr.Video(source="upload", type="filepath", label="Upload Video",
+                                        interactive= True, visible= False)
+                    video2 = gr.Video(source="webcam", label="Record Video", type="filepath",include_audio= True,
+                                        interactive= True, visible= False)
+                    file_in = gr.Files(label="Upload File or Files", interactive= True, visible= False)
+
+                    submit = gr.Button()
+
+                # Right column: outputs and the speaker-naming controls.
+                with gr.Column():
+
+                    out_txt = gr.Textbox(label="Output",
+                                            visible= True, show_copy_button=True)
+
+                    out_json = gr.JSON(label="JSON Output",
+                                        visible= False, show_copy_button=True)
+
+                    annotation = gr.Textbox(label="Name your speaker's",
+                                        info= "Please provide a list of the speakers arranged \
+                                        in the order in which they appear in the input. Use comma ',' \
+                                        as a seperator. Be aware that the first name is given \
+                                            to SPEAKER_00 the second to SPEAKER_01 and so on.",
+                                        visible= False, interactive= True)
+
+                    annotate = gr.Button(value="Annotate", visible= False, interactive= True)
+
+            # Define usage of components
+            input_type.change(fn=select_origin, inputs=[input_type],
+                            outputs=[audio1, audio2, video1, video2, file_in])
+
+            task.change(fn=select_task, inputs=[task],
+                        outputs=[num_speakers, translate, language])
+
+            # Each option widget echoes its own new value back to itself.
+            translate.change(fn= lambda x : gr.update(value = x),
+                                inputs=[translate], outputs=[translate])
+            num_speakers.change(fn= lambda x : gr.update(value = x),
+                                inputs=[num_speakers], outputs=[num_speakers])
+            language.change(fn= lambda x : gr.update(value = x), 
+                            inputs=[language], outputs=[language])
+
+            submit.click(fn = run_scraibe, 
+                            inputs=[task, num_speakers, translate, language, audio1,
+                                    audio2, video1, video2, file_in],
+                            outputs=[out_txt, out_json, annotation, annotate])
+
+            annotate.click(fn = annotate_output, inputs=[annotation, out_json],
+                            outputs=[out_txt, out_json])
+
+    return demo