File size: 980 Bytes
9a199b4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
import sounddevice as sd
import scipy.io.wavfile as wav
import nemo.collections.asr as nemo_asr

# ===== SETTINGS =====
SAMPLE_RATE = 16000
DURATION = 10  # seconds
OUTPUT_FILE = "arabic_recording.wav"
# NOTE: machine-specific absolute path; edit it to point at your local .nemo checkpoint.
MODEL_PATH = "C:/Users/thegh/Python_Projects/Expertflow/UnderProgress/Peter_Projects/nvidia_asr_eg_conformer_better_than_whisper/stt_ar_fastconformer_hybrid_large_pcd_v1.0.nemo"


def record_audio(output_file=OUTPUT_FILE, duration=DURATION, sample_rate=SAMPLE_RATE):
    """Record mono 16-bit audio with sounddevice and save it as a WAV file.

    Args:
        output_file: Path of the WAV file to write.
        duration: Recording length in seconds.
        sample_rate: Sampling rate in Hz.

    Returns:
        The path the recording was written to (``output_file``).
    """
    print("🎙️ Recording... Speak Arabic now!")
    frame_count = int(sample_rate * duration)
    audio = sd.rec(frame_count, samplerate=sample_rate, channels=1, dtype='int16')
    # sd.rec() is started here and sd.wait() is called before the buffer is
    # written, so the file is only saved once the capture has finished.
    sd.wait()
    wav.write(output_file, sample_rate, audio)
    print(f"✅ Recording finished. Saved as {output_file}")
    return output_file


def load_asr_model(model_path=MODEL_PATH):
    """Restore the Arabic ASR model from a local ``.nemo`` checkpoint.

    The checkpoint file name indicates a hybrid (RNNT + CTC) model, so the
    generic ``ASRModel`` entry point is used instead of the CTC-only class;
    NOTE(review): this relies on NeMo resolving the concrete model class from
    the checkpoint's own config - confirm against the installed NeMo version.

    Args:
        model_path: Path to the ``.nemo`` checkpoint file.

    Returns:
        The restored NeMo ASR model.
    """
    print("📥 Loading Arabic ASR model...")
    return nemo_asr.models.ASRModel.restore_from(model_path)


def transcription_text(result):
    """Return the text of the first utterance in a ``transcribe()`` result.

    The result may be a list of strings, a list of hypothesis objects that
    carry a ``.text`` attribute, a list of n-best lists, or a
    ``(best_hypotheses, all_hypotheses)`` tuple. All of these are reduced to
    one plain string so the caller never prints a list or an object repr.

    Args:
        result: Whatever ``asr_model.transcribe([...])`` returned.

    Returns:
        The first utterance's text, or ``""`` when there is no result.
    """
    # (best_hypotheses, all_hypotheses) tuple: keep only the best hypotheses.
    if isinstance(result, tuple) and result and isinstance(result[0], list):
        result = result[0]
    if not result:
        return ""

    first = result[0]
    # n-best output: one list of candidates per utterance; take the top one.
    if isinstance(first, (list, tuple)):
        if not first:
            return ""
        first = first[0]

    # Hypothesis-like objects expose the string as `.text`; plain strings pass through.
    text = getattr(first, "text", first)
    return "" if text is None else str(text)


def main():
    """Record a clip, load the ASR model, and print the transcription."""
    # ===== STEP 1: Record audio =====
    recording = record_audio()

    # ===== STEP 2: Load ASR model =====
    asr_model = load_asr_model()

    # ===== STEP 3: Transcribe =====
    print("🔍 Transcribing...")
    transcription = asr_model.transcribe([recording])
    print("📝 Transcription:", transcription_text(transcription))


if __name__ == "__main__":
    main()