"""Transcribe an audio file with Whisper and print the recognized text.

Usage:
    python <this_script> <audio-file>
"""

import sys
from typing import Optional, Sequence

# Name of the Whisper checkpoint handed to ``whisper.load_model``.
# You can also try "base", "small", "medium".
MODEL_NAME = "small"


def main(argv: Optional[Sequence[str]] = None) -> int:
    """Transcribe the file named on the command line and print the result.

    Args:
        argv: Full argument vector, program name first. Defaults to
            ``sys.argv`` when omitted.

    Returns:
        Process exit status: ``0`` after a transcription has been printed,
        ``2`` when no input file was supplied.
    """
    args = sys.argv if argv is None else argv

    # Validate before touching Whisper so a missing argument yields a clear
    # usage message instead of an IndexError traceback.
    if len(args) < 2:
        prog = args[0] if args else "transcribe.py"
        print(f"usage: {prog} <audio-file>", file=sys.stderr)
        return 2

    input_file = args[1]

    # Imported lazily: the import is only needed once we know there is work
    # to do, and it keeps argument errors independent of the dependency.
    import whisper

    model = whisper.load_model(MODEL_NAME)
    result = model.transcribe(input_file, verbose=True)

    print(input_file)
    print(result["text"])
    return 0


if __name__ == "__main__":
    sys.exit(main())