Auto-update: Tue Feb 11 14:35:32 PST 2025
This commit is contained in:
parent
758b8ef136
commit
c91189d181
1 changed files with 0 additions and 48 deletions
48
mlx
48
mlx
|
@ -1,48 +0,0 @@
|
|||
#!/usr/bin/env python3
|
||||
|
||||
import argparse
|
||||
import os
|
||||
import sys
|
||||
import tempfile
|
||||
import subprocess
|
||||
from lightning_whisper_mlx import LightningWhisperMLX
|
||||
|
||||
def convert_to_mp3(input_path):
|
||||
"""Convert input file to MP3 using ffmpeg if necessary, storing in a temporary directory."""
|
||||
if input_path.lower().endswith(".mp3"):
|
||||
return input_path # No conversion needed
|
||||
|
||||
temp_dir = tempfile.mkdtemp()
|
||||
output_path = os.path.join(temp_dir, "converted.mp3")
|
||||
|
||||
try:
|
||||
subprocess.run(["ffmpeg", "-y", "-i", input_path, "-q:a", "2", output_path],
|
||||
check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
|
||||
except subprocess.CalledProcessError:
|
||||
sys.exit("Error: Failed to convert file to MP3. Ensure ffmpeg is installed.")
|
||||
|
||||
return output_path
|
||||
|
||||
def main():
|
||||
parser = argparse.ArgumentParser(description="Transcribe or translate audio using LightningWhisperMLX.")
|
||||
parser.add_argument("file", help="Path to the audio file.")
|
||||
parser.add_argument("--translate", action="store_true", help="Enable translation mode.")
|
||||
|
||||
args = parser.parse_args()
|
||||
|
||||
audio_path = convert_to_mp3(args.file)
|
||||
|
||||
# Selecting a valid model
|
||||
whisper = LightningWhisperMLX(model="large-v3", batch_size=12, quant=None)
|
||||
|
||||
if args.translate:
|
||||
print("Translation mode enabled.")
|
||||
result = whisper.transcribe(audio_path=audio_path, language="en") # Explicitly setting language to English
|
||||
else:
|
||||
result = whisper.transcribe(audio_path=audio_path)
|
||||
|
||||
print(result['text'])
|
||||
|
||||
if __name__ == "__main__":
|
||||
main()
|
||||
|
Loading…
Add table
Reference in a new issue