Spaces:

innocentpeter
/

talkAI

Runtime error

talkAI / stt_engine.py

Upload 9 files

c3a047c verified 3 months ago

1.13 kB

	import torch
	from transformers import pipeline

	class STTEngine:
	    """Speech-to-text wrapper around a Hugging Face Whisper ASR pipeline."""

	    # Language names accepted by transcribe() and the code handed to Whisper.
	    # NOTE(review): Whisper's published language list does not appear to
	    # include "ig" (Igbo) or "pcm" (Nigerian Pidgin); confirm the loaded
	    # model accepts these codes, otherwise generation may reject them.
	    _LANGUAGE_CODES = {
	        "english": "en",
	        "hausa": "ha",
	        "yoruba": "yo",
	        "igbo": "ig",
	        "pidgin": "pcm",
	    }

	    # Code used when the requested language is missing or unrecognised.
	    _DEFAULT_LANGUAGE = "en"

	    def __init__(self, model_name="openai/whisper-small"):
	        """Load the automatic-speech-recognition pipeline.

	        Args:
	            model_name (str): model identifier passed to ``pipeline``.
	        """
	        # Use the first CUDA device when one is available, otherwise -1 (CPU).
	        device = 0 if torch.cuda.is_available() else -1
	        self.asr = pipeline(
	            "automatic-speech-recognition",
	            model=model_name,
	            device=device,
	        )

	    def transcribe(self, audio_path, language="en"):
	        """Transcribe an audio file to text using Whisper.

	        Args:
	            audio_path (str): path to .wav file; ``None`` yields ``""``.
	            language (str): either a language name ('english', 'hausa',
	                'yoruba', 'igbo', 'pidgin') or the matching code ('en',
	                'ha', 'yo', 'ig', 'pcm'). Matching ignores case and
	                surrounding whitespace. Anything else, including ``None``,
	                falls back to English.

	        Returns:
	            str: the pipeline's ``"text"`` result with surrounding
	            whitespace stripped, or ``""`` when ``audio_path`` is ``None``.
	        """
	        if audio_path is None:
	            return ""

	        whisper_lang = self._resolve_language(language)
	        result = self.asr(audio_path, generate_kwargs={"language": whisper_lang})
	        return result["text"].strip()

	    @classmethod
	    def _resolve_language(cls, language):
	        """Map a language name or code to the code passed to Whisper."""
	        # A UI may hand over None or another non-string; treat it as "unset".
	        if not isinstance(language, str):
	            return cls._DEFAULT_LANGUAGE

	        key = language.strip().lower()
	        if key in cls._LANGUAGE_CODES:
	            return cls._LANGUAGE_CODES[key]
	        # Codes were previously looked up as names and silently became "en";
	        # pass a known code straight through instead.
	        if key in cls._LANGUAGE_CODES.values():
	            return key
	        return cls._DEFAULT_LANGUAGE