alaatiger989
/

Ambulance_App_ASR_Detection

Model card Files Files and versions

Ambulance_App_ASR_Detection / main.py

alaatiger989's picture

Upload folder using huggingface_hub

9a199b4 verified 4 months ago

history blame contribute delete

980 Bytes

	import sounddevice as sd
	import scipy.io.wavfile as wav
	import nemo.collections.asr as nemo_asr

	# ===== SETTINGS =====
	SAMPLE_RATE = 16000
	DURATION = 10 # seconds
	OUTPUT_FILE = "arabic_recording.wav"

	# ===== STEP 1: Record audio =====
	print("🎙️ Recording... Speak Arabic now!")
	audio = sd.rec(int(SAMPLE_RATE * DURATION), samplerate=SAMPLE_RATE, channels=1, dtype='int16')
	sd.wait()
	wav.write(OUTPUT_FILE, SAMPLE_RATE, audio)
	print(f"✅ Recording finished. Saved as {OUTPUT_FILE}")

	# ===== STEP 2: Load ASR model =====
	print("📥 Loading Arabic ASR model...")
	asr_model = nemo_asr.models.EncDecCTCModel.restore_from("C:/Users/thegh/Python_Projects/Expertflow/UnderProgress/Peter_Projects/nvidia_asr_eg_conformer_better_than_whisper/stt_ar_fastconformer_hybrid_large_pcd_v1.0.nemo")

	# ===== STEP 3: Transcribe =====
	print("🔍 Transcribing...")
	transcription = asr_model.transcribe([OUTPUT_FILE])
	print("📝 Transcription:", transcription[0])