Whisper is OpenAI’s robust speech recognition and transcription model. With InferX, you can run Whisper on any device using the same API - from edge devices to powerful servers.
import os

# Batch-transcription example: run the Whisper model over every audio file in
# AUDIO_DIR and write one UTF-8 text transcript per file into TRANSCRIPT_DIR.
AUDIO_DIR = "audio_folder"
TRANSCRIPT_DIR = "transcripts"
AUDIO_EXTENSIONS = ('.wav', '.mp3', '.m4a')

# NOTE(review): `whisper` is not imported in this snippet; it is presumably
# brought into scope by an earlier InferX import -- confirm against the docs.
model = whisper()

# Create the output directory up front so the first write cannot fail with
# FileNotFoundError on a fresh checkout.
os.makedirs(TRANSCRIPT_DIR, exist_ok=True)

# Process multiple audio files.
# Match extensions case-insensitively (so "CLIP.WAV" is picked up too) and
# sort the names so the processing order is deterministic across runs.
audio_files = sorted(
    name
    for name in os.listdir(AUDIO_DIR)
    if name.lower().endswith(AUDIO_EXTENSIONS)
)

for audio_file in audio_files:
    result = model.inference(audio_path=os.path.join(AUDIO_DIR, audio_file))

    # Save transcription.
    # Swap only the final extension; chained str.replace() would also rewrite
    # ".wav"/".mp3"/".m4a" occurring in the middle of a file name.
    transcript_file = os.path.splitext(audio_file)[0] + '.txt'
    transcript_path = os.path.join(TRANSCRIPT_DIR, transcript_file)

    # Explicit encoding: transcripts may contain non-ASCII text, and the
    # platform default encoding is not guaranteed to be UTF-8.
    with open(transcript_path, 'w', encoding='utf-8') as transcript:
        transcript.write(result['text'])

    print(f"Processed: {audio_file} -> {transcript_file}")