From 485a32cd514bdd998732fe5fc29b3ed0d9e81c94 Mon Sep 17 00:00:00 2001
From: Jacob Schmieder <Jacob.Schmieder@dbfz.de>
Date: Fri, 22 Sep 2023 18:16:46 +0200
Subject: [PATCH] Delete app2.py

app2.py is an identical copy of scraibe/app/gradio_app.py; remove the duplicate.
---
 app2.py | 317 --------------------------------------------------------
 1 file changed, 317 deletions(-)
 delete mode 100644 app2.py

diff --git a/app2.py b/app2.py
deleted file mode 100644
index 55cb11b..0000000
--- a/app2.py
+++ /dev/null
@@ -1,317 +0,0 @@
-"""
-Gradio Audio Transcription App.
---------------------------------
-
-This module provides an interface to transcribe audio files using the 
-AutoTranscribe model. Users can either upload an audio file or record their speech 
-live for transcription. The application supports multiple languages and provides 
-options to specify the number of speakers and the language of the audio.
-
-Attributes:
-    LANGUAGES (list): A list of supported languages for transcription.
-
-Usage:
-    Run this script to start the Gradio web interface for audio transcription.
-    
-"""
-
-
-import json
-
-import gradio as gr
-from scraibe import AutoTranscribe, Transcript
-
-
-
-theme = gr.themes.Soft(
-    primary_hue="green",
-    secondary_hue='orange',
-    neutral_hue="gray",
-    
-)
-LANGUAGES = [
-    "Afrikaans", "Arabic", "Armenian", "Azerbaijani", "Belarusian",
-    "Bosnian", "Bulgarian", "Catalan", "Chinese", "Croatian",
-    "Czech", "Danish", "Dutch", "English", "Estonian",
-    "Finnish", "French", "Galician", "German", "Greek",
-    "Hebrew", "Hindi", "Hungarian", "Icelandic", "Indonesian",
-    "Italian", "Japanese", "Kannada", "Kazakh", "Korean",
-    "Latvian", "Lithuanian", "Macedonian", "Malay", "Marathi",
-    "Maori", "Nepali", "Norwegian", "Persian", "Polish",
-    "Portuguese", "Romanian", "Russian", "Serbian", "Slovak",
-    "Slovenian", "Spanish", "Swahili", "Swedish", "Tagalog",
-    "Tamil", "Thai", "Turkish", "Ukrainian", "Urdu",
-    "Vietnamese", "Welsh"
-]
-
-class GradioTranscriptionInterface:
-    """
-    Interface handling the interaction between Gradio UI and the Audio Transcription system.
-    """
-
-    def __init__(self, model: AutoTranscribe = AutoTranscribe()):
-        """
-        Initializes the GradioTranscriptionInterface with a transcription model.
-
-        Args:
-            model (AutoTranscribe): Model responsible for audio transcription tasks.
-        """
-        self.model = model
-
-    def auto_transcribe(self, source,
-                        num_speakers : int,
-                        translation : bool,
-                        language : str):
-        """
-        Shortcut method for the AutoTranscribe task.
-
-        Returns:
-            tuple: Transcribed text (str), JSON output (dict)
-        """
-        
-        kwargs = {
-            "num_speakers": num_speakers if num_speakers != 0 else None,
-            "language": language if language != "None" else None,
-            "task": 'translate' if translation else None
-        }
-        
-        try:
-            result = self.model.autotranscribe(source, **kwargs)
-        except ValueError:
-            raise gr.Error("Couldn't detect any speech in the provided audio. \
-                    Please try again!")
-        return str(result), result.get_json()
-
-
-    def transcribe(self, source, translation, language):
-        """
-        Shortcut method for the Transcribe task.
-
-        Returns:
-            str: Transcribed text.
-        """
-        kwargs = {
-            "language": language if language != "None" else None,
-            "task": 'translate' if translation == "Yes" else None
-        }
-        
-        result = self.model.transcribe(source, **kwargs)
-        return str(result)
-
-    def perform_diarisation(self, source, num_speakers):
-        """
-        Shortcut method for the Diarisation task.
-
-        Returns:
-            str: JSON output of diarisation result.
-        """
-        kwargs = {
-            "num_speakers": num_speakers if num_speakers != 0 else None,
-        }
-        
-        
-        try:
-            result = self.model.diarization(source, **kwargs)
-        except ValueError:
-            raise gr.Error("Couldn't detect any speech in the provided audio. \
-                    Please try again!")
-        return json.dumps(result, indent=2)
-
-####
-# Gradio Interface
-####
-
-pipe = GradioTranscriptionInterface()
-
-
-def select_task(choice):
-    if choice == 'Auto Transcribe':
-        
-        return (gr.update(visible = True),
-                gr.update(visible = True),
-                gr.update(visible = True))
-                
-        
-    elif choice == 'Transcribe':
-        
-        return (gr.update(visible = False),
-                gr.update(visible = True),
-                gr.update(visible = True))
-
-        
-    elif choice == 'Diarisation':
-        
-        return (gr.update(visible = True),
-                gr.update(visible = False),
-                gr.update(visible = False))
-    
-def select_origin(choice):
-    if choice == "Upload Audio":
-        
-        return (gr.update(visible = True),
-                gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None))
-    
-    elif choice == "Record Audio":
-        
-        return (gr.update(visible = False, value = None),
-                gr.update(visible = True),
-                gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None))
-
-    elif choice == "Upload Video":
-        
-        return (gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None),
-                gr.update(visible = True),
-                gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None))
-    
-    elif choice == "Record Video":
-        
-        return (gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None),
-                gr.update(visible = True),
-                gr.update(visible = False, value = None))
-        
-    elif choice == "File":
-        
-        return (gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None),
-                gr.update(visible = False, value = None),
-                gr.update(visible = True))
-
-def run_scribe(task, num_speakers, translate, language, audio1, audio2, video1, video2, file_in, progress = gr.Progress(track_tqdm= True)):
-    # get *args which are not None
-    progress(0, desc='Starting task...')
-    source = audio1 or audio2 or video1 or video2 or file_in
-    
-    if task == 'Auto Transcribe':
-        
-        out_str , out_json = pipe.auto_transcribe(source = source,
-                             num_speakers = num_speakers,
-                             translation = translate,
-                             language = language)
-        
-        return (gr.update(value = out_str, visible = True),
-                gr.update(value = out_json, visible = True),
-                gr.update(visible = True),
-                gr.update(visible = True))        
-        
-    elif task == 'Transcribe':
-        
-        out = pipe.transcribe(source = source,
-                             translation = translate,
-                             language = language)
-        
-        return (gr.update(value = out, visible = True),
-                gr.update(value = None, visible = False),
-                gr.update(visible = False),
-                gr.update(visible = False))
-        
-    elif task == 'Diarisation':
-        
-        out = pipe.perform_diarisation(source = source,
-                             num_speakers = num_speakers)
-        
-        return (gr.update(value = None, visible = False),
-                gr.update(value = out, visible = True),
-                gr.update(visible = False),
-                gr.update(visible = False))
-    
-def annotate_output(annoation : str, out_json : dict):
-    # get *args which are not None
-    
-    trans = Transcript.from_json(out_json)
-    trans = trans.annotate(*annoation.split(","))
-
-    return gr.update(value = str(trans)),gr.update(value = trans.get_json())
-    
-    
-with gr.Blocks(theme=theme,title='ScrAIbe: Automatic Audio Transcription') as demo:
-    
-    # Define components
-    header = open("header.html", "r").read()
-    gr.HTML(header,  visible= True, show_label=False)
-    
-    with gr.Row():
-        
-        with gr.Column():
-        
-            task = gr.Radio(["Auto Transcribe", "Transcribe", "Diarisation"], label="Task",
-                            value= 'Auto Transcribe')
-            
-            num_speakers = gr.Number(value=0, label= "Number of speakers (optional)", 
-                            info = "Number of speakers in the audio file. If you don't know,\
-                                leave it at 0.", visible= True)
-            
-            translate = gr.Checkbox(label="Translation", choices=[True, False], value = False,
-                            info="Select 'Yes' to have the output translated into English.",
-                            visible= True)
-            
-            language = gr.Dropdown(LANGUAGES,
-                            label="Language (optional)", value = "None",
-                            info="Language of the audio file. If you don't know,\
-                                leave it at None.", visible= True)
-            
-            input = gr.Radio(["Upload Audio", "Record Audio", "Upload Video","Record Video" 
-                                ,"File"], label="Input Type", value="Upload Audio")
-            
-            audio1 = gr.Audio(source="upload", type="filepath", label="Upload Audio",
-                                interactive= True, visible= True)
-            audio2 = gr.Audio(source="microphone", label="Record Audio", type="filepath",
-                                interactive= True, visible= False)
-            video1 = gr.Video(source="upload", type="filepath", label="Upload Video",
-                                interactive= True, visible= False)
-            video2 = gr.Video(source="webcam", label="Record Video", type="filepath",
-                                interactive= True, visible= False)
-            file_in = gr.File(label="Upload File", interactive= True, visible= False)
-            
-            submit = gr.Button()
-        
-        with gr.Column():
-            
-            out_txt = gr.Textbox(label="Output",
-                                    visible= True, show_copy_button=True)
-            
-            out_json = gr.JSON(label="JSON Output",
-                                visible= False, show_copy_button=True)
-            
-            annoation = gr.Textbox(label="Name your speaker's",
-                                   info= "Please provide a list of the speakers arranged \
-                                   in the order in which they appear in the input. Use comma ',' \
-                                   as a seperator. Be aware that the first name is given \
-                                    to SPEAKER_00 the second to SPEAKER_01 and so on.",
-                                   visible= False, interactive= True)
-            
-            annotate = gr.Button(value="Annotate", visible= False, interactive= True)
-        
-    # Define usage of components
-    input.change(fn=select_origin, inputs=[input],
-                    outputs=[audio1, audio2, video1, video2, file_in])
-    
-    task.change(fn=select_task, inputs=[task],
-                outputs=[num_speakers, translate, language])
-    
-    translate.change(fn= lambda x : gr.update(value = x),
-                        inputs=[translate], outputs=[translate])
-    num_speakers.change(fn= lambda x : gr.update(value = x),
-                        inputs=[num_speakers], outputs=[num_speakers])
-    language.change(fn= lambda x : gr.update(value = x), 
-                    inputs=[language], outputs=[language])
-    
-    submit.click(fn = run_scribe, 
-                    inputs=[task, num_speakers, translate, language, audio1,
-                            audio2, video1, video2, file_in],
-                    outputs=[out_txt, out_json, annoation, annotate])
-    
-    annotate.click(fn = annotate_output, inputs=[annoation, out_json],
-                    outputs=[out_txt, out_json])
-    
-
-demo.queue().launch()
\ No newline at end of file