Python-Scripts/Transcribing/transcription.py at d379240888af8e0a080759fb38e81e03794b5688 · wasmerio/Python-Scripts · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
import sys
import subprocess
import shutil

#functions to install python packages
def installPackage(pkgName):
    print(f"[INFO] {pkgName} not found. Installing...")
    subprocess.check_call([sys.executable, "-m", "pip", "install", pkgName])
    print(f"[INFO] {pkgName} installed successfully!")

try:
    from faster_whisper import WhisperModel
except ImportError:
    installPackage("faster_whisper")
    from faster_whisper import WhisperModel

# Check for ffmpeg
if shutil.which("ffmpeg") is None:
    print(
        "[ERROR] ffmpeg not found on your system.\n"
        "Please install ffmpeg to use this script:\n"
        "- Windows: https://ffmpeg.org/download.html\n"
        "- Linux: sudo apt install ffmpeg\n"
        "- Mac: brew install ffmpeg"
    )
    sys.exit(1)

print("[INFO] All dependencies are ready!")

import os
while True:
    audio_file = input("Enter the name of or path to your audio file (MP3, WAV, MP4 etc.): ").strip()
    if not os.path.isfile(audio_file):
        print(f"[ERROR] File '{audio_file}' does not exist. Please check the path and try again.")
    else:
        break
valid_models = ["tiny", "small", "base", "medium", "large"]
print("Models (Sorted from Fastest-Smallest-Least Accurate To Slowest-Largest-Most Accurate):-\n")
print(valid_models)

while True:
    model_size = input("\nEnter the model size: ").strip().lower()

    if model_size not in valid_models:
        print(f"[ERROR] Invalid model size '{model_size}'. Please choose from {valid_models}.\n")
    else:
        break

model = WhisperModel(model_size)

output_file = audio_file.rsplit(".", 1)[0] + "_transcript.txt"
segments, info = model.transcribe(audio_file)

with open(output_file, "w", encoding="utf-8") as f:
    print("\nTranscribing.")
    for segment in segments:
        print(".", end="", flush=True)
        f.write(segment.text + "\n")
print(f"\n[INFO] Transcription saved to {output_file}")
print("\n -- Scripted by Syed Sultan (github = Syed-56)")