camenduru
/

pocketsphinx-20.04

Model card Files Files and versions

pocketsphinx-20.04 / examples /live.py

camenduru's picture

pocketsphinx-20.04

37a92a9 about 3 years ago

history blame contribute delete

1.31 kB

	#!/usr/bin/env python3
	"""
	Recognize live speech from the default audio device.
	"""

	# MIT license (c) 2022, see LICENSE for more information.
	# Author: David Huggins-Daines <dhdaines@gmail.com>

	from pocketsphinx import Endpointer, Decoder, set_loglevel
	import subprocess
	import sys
	import os


	def main():
	    """Recognize speech from the default audio device until the input ends.

	    Launches ``sox`` to record mono, 16-bit signed-integer audio at the
	    endpointer's sample rate and write it as raw samples to a pipe.  Each
	    frame read from the pipe is passed through the ``Endpointer``; whatever
	    speech it returns is fed to the ``Decoder``.

	    Speech start/end times and partial hypotheses are printed to stderr.
	    The final hypothesis of each utterance, when there is one, is printed
	    to stdout.

	    The loop ends when ``sox`` stops delivering complete frames (for
	    example because it exited).  The ``sox`` process is always stopped
	    and reaped on the way out, including when the caller interrupts the
	    loop with an exception such as ``KeyboardInterrupt``.
	    """
	    set_loglevel("INFO")
	    ep = Endpointer()
	    decoder = Decoder(
	        samprate=ep.sample_rate,
	    )
	    soxcmd = f"sox -q -r {ep.sample_rate} -c 1 -b 16 -e signed-integer -d -t raw -"
	    sox = subprocess.Popen(soxcmd.split(), stdout=subprocess.PIPE)
	    try:
	        while True:
	            frame = sox.stdout.read(ep.frame_bytes)
	            if len(frame) < ep.frame_bytes:
	                # A buffered pipe read only comes up short at end of
	                # stream, i.e. sox has stopped producing audio.  Stop
	                # instead of feeding truncated/empty frames forever.
	                break
	            # Remember the state before this frame so a silence -> speech
	            # transition can be detected below.
	            prev_in_speech = ep.in_speech
	            speech = ep.process(frame)
	            if speech is None:
	                continue
	            if not prev_in_speech:
	                print("Speech start at %.2f" % (ep.speech_start), file=sys.stderr)
	                decoder.start_utt()
	            decoder.process_raw(speech)
	            hyp = decoder.hyp()
	            if hyp is not None:
	                print("PARTIAL RESULT:", hyp.hypstr, file=sys.stderr)
	            if not ep.in_speech:
	                print("Speech end at %.2f" % (ep.speech_end), file=sys.stderr)
	                decoder.end_utt()
	                # hyp() can return None (the partial-result path above
	                # already guards for that), so guard the final result too
	                # rather than crashing on ``None.hypstr``.
	                final_hyp = decoder.hyp()
	                if final_hyp is not None:
	                    print(final_hyp.hypstr)
	    finally:
	        # Do not leave the recorder running or the pipe open, whatever
	        # the reason for leaving the loop.
	        sox.stdout.close()
	        sox.terminate()
	        sox.wait()


	# Script entry point: run the recognizer.  The user is expected to stop it
	# with Ctrl-C, so the resulting KeyboardInterrupt is swallowed on purpose
	# to exit without printing a traceback.
	try:
	    main()
	except KeyboardInterrupt:
	    pass