Add files via upload

2022-12-20 13:54:29 +01:00
parent 085b3180e5
commit 60ef9c0db8
9 changed files with 340 additions and 0 deletions
@@ -0,0 +1,4 @@
+from autotranscript.__main__ import *
+from autotranscript.version import get_version as _get_version
+
+__version__ = _get_version()
@@ -0,0 +1,126 @@
+
+import whisper
+from time import time
+import os
+from moviepy.editor import *
+from typing import Union
+
+class Transcribe:
+    def __init__(self, audiofile : Union[bool, str, list] = None, model : str =  "medium", language :str =  "German"):
+        """
+         Class to autotranscript audio and video files with the Whisper model
+        :param audiofile: audio file or list of audio files
+        :param model: model to use for transcription
+        :param language: language of the audio file
+        """
+
+        self.audiofile = audiofile
+
+        self.language = language
+
+        """
+        Create folder structure
+        """
+
+        self.currentpath,\
+            self.audiopath,\
+            self.transcriptionpath,\
+            self.audiofiles = self.create_folder_structure() # create folder structure
+
+        print("loading model")
+        self.model = whisper.load_model(model)  # load model
+        print("model loaded")
+
+    def create_folder_structure(self):
+        """
+        Create folder structure for audio and transcription files
+
+        :return:  currentpath, audiopath, transcriptionpath, audiofiles
+        """
+        currentpath = os.getcwd() # get current path
+
+        if not os.path.exists(os.path.join(currentpath, 'audiofiles')):
+            print('Creating audiofiles folder')
+            os.makedirs(os.path.join(currentpath, 'audiofiles'))
+        if not os.path.exists(os.path.join(currentpath, 'transcription')):
+            print('Creating transcription folder')
+            os.makedirs(os.path.join(currentpath, 'transcription'))
+
+        audiopath = os.path.join(currentpath, 'audiofiles')  # path to audio files
+        transcriptionpath = os.path.join(currentpath, 'transcription') # path to transcription files
+
+        audiofiles = os.listdir(audiopath) # list of audio files
+
+        return currentpath, audiopath, transcriptionpath, audiofiles
+
+    def video_to_audio(self,file,  remove_video=True):
+        clip = VideoFileClip(file)
+        clip.audio.write_audiofile(os.path.join(file[:-4] + '.mp3'))
+        if remove_video:
+            os.remove(file)
+            print(f'Video {file} removed')
+        return os.path.join(file[:-4] + '.mp3')
+
+
+    def transcribe(self):
+
+        if self.audiofile is not None:
+            if self.audiofile in self.audiofiles:
+                audiofile = os.path.join(self.audiopath, self.audiofile)
+            else:
+                raise ValueError('Audio file not found')
+
+            if audiofile.endswith('.mp4'):
+                print('Converting video to audio')
+                audiofile = self.video_to_audio(audiofile)
+
+            print(f'Start transcribing Audio file: {audiofile}')
+            _stime = time()
+            result = self.model.transcribe(audiofile, verbose=True, language= self.language)
+
+            print(f'Transcription finished in {time() - _stime} seconds')
+
+            txtfilename = str(audiofile.split('/')[-1][:-4]) + '.txt'
+
+            savepath = os.path.join(self.transcriptionpath, txtfilename)
+
+            with open(savepath, 'w') as f:
+                f.write(result["text"])
+        elif self.audiofile is None or isinstance(self.audiofile, list):
+            print('No audio file specified or list of audio files')
+            print(f"{len(self.audiofiles)} audio files found in {self.audiopath}")
+            print("Start transcribing all audio files")
+            i = 0
+            for audiofile in self.audiofiles:
+
+                audiofile = os.path.join(self.audiopath, audiofile)
+
+                if audiofile.endswith('.mp4'):
+                    audiofile = self.video_to_audio(audiofile)
+
+                print(f'Start transcribing Audio file: {audiofile}')
+                _stime = time()
+                result = self.model.transcribe(audiofile, verbose=True, language=self.language)
+                print(f'Transcription finished in {time() - _stime} seconds')
+
+                txtfilename = str(audiofile.split('/')[-1][:-4]) + '.txt'
+
+                savepath = os.path.join(self.transcriptionpath, txtfilename)
+
+                with open(savepath, 'w') as f:
+                    f.write(result["text"])
+
+                i += 1
+                print(f'{i} of {len(self.audiofiles)} files transcribed')
+
+        else:
+            raise ValueError('Audio file not found')
+
+        print('Transcription finished')
+
+    def __call__(self):
+        return self.transcribe()
+    def __repr__(self):
+        return f"Transcribe(audiofile={self.audiofile}, model={self.model}, language={self.language})"
+    def __str__(self):
+        return f"Transcribe(audiofile={self.audiofile}, model={self.model}, language={self.language})"
@@ -0,0 +1,69 @@
+import os
+import subprocess as sp
+
+MAJOR = 1
+MINOR = 0
+MICRO = 0
+MICRO_POST = 0
+ISRELEASED = False
+VERSION = '%d.%d.%d.%d' % (MAJOR, MINOR, MICRO, MICRO_POST)
+
+# Return the git revision as a string
+# taken from numpy/numpy
+def git_version():
+    def _minimal_ext_cmd(cmd):
+        # construct minimal environment
+        env = {}
+        for k in ['SYSTEMROOT', 'PATH', 'HOME']:
+            v = os.environ.get(k)
+            if v is not None:
+                env[k] = v
+
+        # LANGUAGE is used on win32
+        env['LANGUAGE'] = 'C'
+        env['LANG'] = 'C'
+        env['LC_ALL'] = 'C'
+
+        out = sp.Popen(cmd, stdout=sp.PIPE, stderr=sp.PIPE, env=env).communicate()[0]
+        return out
+
+    try:
+        out = _minimal_ext_cmd(['git', 'rev-parse', 'HEAD'])
+        GIT_REVISION = out.strip().decode('ascii')
+    except OSError:
+        GIT_REVISION = "Unknown"
+
+    return GIT_REVISION
+
+def _get_git_version():
+    cwd = os.getcwd()
+
+    # go to the main directory
+    fdir = os.path.dirname(os.path.abspath(__file__))
+    maindir = os.path.abspath(os.path.join(fdir, ".."))
+    # maindir = fdir # os.path.join(fdir, "..")
+    os.chdir(maindir)
+
+    # get git version
+    res = git_version()
+
+    # restore the cwd
+    os.chdir(cwd)
+    return res
+
+def get_version(build_version=False):
+    if ISRELEASED:
+        return VERSION
+
+    # unreleased version
+    GIT_REVISION = _get_git_version()
+
+    if build_version:
+        import datetime as dt
+        date = dt.date.strftime(dt.datetime.now(), "%Y%m%d%H%M%S")
+        return VERSION + ".dev" + date
+    else:
+        return VERSION + ".dev0+" + GIT_REVISION[:7]
+
+
+
@@ -0,0 +1,96 @@
+name: whisper
+channels:
+  - pytorch
+  - conda-forge
+  - defaults
+dependencies:
+  - _libgcc_mutex=0.1=main
+  - _openmp_mutex=5.1=1_gnu
+  - blas=1.0=mkl
+  - bzip2=1.0.8=h7b6447c_0
+  - ca-certificates=2022.10.11=h06a4308_0
+  - certifi=2022.9.24=py39h06a4308_0
+  - cudatoolkit=11.3.1=h9edb442_10
+  - ffmpeg=4.2.2=h20bf706_0
+  - freetype=2.12.1=h4a9f257_0
+  - giflib=5.2.1=h7b6447c_0
+  - gmp=6.2.1=h295c915_3
+  - gnutls=3.6.15=he1e5248_0
+  - intel-openmp=2021.4.0=h06a4308_3561
+  - jpeg=9e=h7f8727e_0
+  - lame=3.100=h7b6447c_0
+  - lcms2=2.12=h3be6417_0
+  - ld_impl_linux-64=2.38=h1181459_1
+  - lerc=3.0=h295c915_0
+  - libdeflate=1.8=h7f8727e_5
+  - libffi=3.3=he6710b0_2
+  - libgcc-ng=11.2.0=h1234567_1
+  - libgomp=11.2.0=h1234567_1
+  - libidn2=2.3.2=h7f8727e_0
+  - libopus=1.3.1=h7b6447c_0
+  - libpng=1.6.37=hbc83047_0
+  - libstdcxx-ng=11.2.0=h1234567_1
+  - libtasn1=4.16.0=h27cfd23_0
+  - libtiff=4.4.0=hecacb30_2
+  - libunistring=0.9.10=h27cfd23_0
+  - libuv=1.40.0=h7b6447c_0
+  - libvpx=1.7.0=h439df22_0
+  - libwebp=1.2.4=h11a3e52_0
+  - libwebp-base=1.2.4=h5eee18b_0
+  - lz4-c=1.9.3=h295c915_1
+  - mkl=2021.4.0=h06a4308_640
+  - mkl-service=2.4.0=py39h7f8727e_0
+  - mkl_fft=1.3.1=py39hd3c417c_0
+  - mkl_random=1.2.2=py39h51133e4_0
+  - ncurses=6.3=h5eee18b_3
+  - nettle=3.7.3=hbbd107a_1
+  - numpy=1.23.4=py39h14f4228_0
+  - numpy-base=1.23.4=py39h31eccc5_0
+  - openh264=2.1.1=h4ff587b_0
+  - openssl=1.1.1s=h7f8727e_0
+  - pillow=9.2.0=py39hace64e9_1
+  - pip=22.2.2=py39h06a4308_0
+  - python=3.9.15=haa1d7c7_0
+  - pytorch=1.10.1=py3.9_cuda11.3_cudnn8.2.0_0
+  - pytorch-mutex=1.0=cuda
+  - readline=8.2=h5eee18b_0
+  - setuptools=65.5.0=py39h06a4308_0
+  - six=1.16.0=pyhd3eb1b0_1
+  - sqlite=3.39.3=h5082296_0
+  - tk=8.6.12=h1ccaba5_0
+  - torchaudio=0.10.1=py39_cu113
+  - torchvision=0.11.2=py39_cu113
+  - typing_extensions=4.3.0=py39h06a4308_0
+  - tzdata=2022f=h04d1e81_0
+  - wheel=0.37.1=pyhd3eb1b0_0
+  - x264=1!157.20191217=h7b6447c_0
+  - xz=5.2.6=h5eee18b_0
+  - zlib=1.2.13=h5eee18b_0
+  - zstd=1.5.2=ha4553b6_0
+  - pip:
+    - charset-normalizer==2.1.1
+    - decorator==4.4.2
+    - ffmpeg-python==0.2.0
+    - filelock==3.8.0
+    - future==0.18.2
+    - huggingface-hub==0.11.0
+    - idna==3.4
+    - imageio==2.23.0
+    - imageio-ffmpeg==0.4.7
+    - more-itertools==9.0.0
+    - moviepy==1.0.3
+    - packaging==21.3
+    - proglog==0.1.10
+    - pydub==0.25.1
+    - pyparsing==3.0.9
+    - pyyaml==6.0
+    - regex==2022.10.31
+    - requests==2.28.1
+    - semantic-version==2.10.0
+    - setuptools-rust==1.5.2
+    - tokenizers==0.13.2
+    - tqdm==4.64.1
+    - transformers==4.24.0
+    - urllib3==1.26.12
+    - whisper==1.0
+prefix: /home/jacob/anaconda3/envs/whisper
@@ -0,0 +1,3 @@
+whisper~=1.0
+moviepy~=1.0.3
+setuptools~=65.5.0
@@ -0,0 +1,38 @@
+import pkg_resources
+import os
+from setuptools import setup, find_packages
+
+module_name = "autotranscript"
+github_url = "https://github.com/Jaikinator/transcriptor"
+
+file_dir = os.path.dirname(os.path.realpath(__file__))
+absdir = lambda p: os.path.join(file_dir, p)
+
+############### versioning ###############
+verfile = os.path.abspath(os.path.join(module_name, "version.py"))
+version = {"__file__": verfile}
+
+with open(verfile, "r") as fp:
+    exec(fp.read(), version)
+
+############### setup ###############
+
+build_version = "OPTB_BUILD" in os.environ
+
+setup(
+    name=module_name,
+    version=version["get_version"](build_version),
+    packages=find_packages(),
+    python_requires="~=3.9",
+    readme="README.md",
+    install_requires = [str(r) for r in pkg_resources.parse_requirements(
+            open(os.path.join(os.path.dirname(__file__), "requirements.txt"))
+        )
+    ],
+    url= github_url,
+    license='',
+    author='Jacob Schmieder',
+    author_email='',
+    description='Transcription tool for audio files based on Whisper',
+    #entry_points={'console_scripts': ['autotranscript = autotranscript.__main__:main']}
+)
@@ -0,0 +1,4 @@
+from autotranscript import Transcribe
+
+Transcribe().transcribe()
+