Spaces:

jeongsoo
/

STT_TTS_chatbot

Paused

App Files Files Community

STT_TTS_chatbot / utils /huggingface_tts.py

jeongsoo

Add application file

5688789 about 1 year ago

raw

history blame contribute delete

3.21 kB

	import os
	import torch
	import torchaudio
	import tempfile
	from transformers import pipeline
	import time
	import warnings


	class HuggingFaceTTS:
	    """Text-to-speech helper built on a Hugging Face ``text-to-speech`` pipeline.

	    The constructor does not raise when the model fails to load; it records
	    the outcome in ``self.available``, and ``generate_speech`` returns
	    ``False`` for as long as the model is unavailable.
	    """

	    def __init__(self, model_name="facebook/mms-tts-eng"):
	        """Load the TTS pipeline for ``model_name``.

	        Args:
	            model_name: Name of the TTS model to load.
	        """
	        # Becomes True only after the pipeline has loaded successfully.
	        self.available = False
	        self.model_name = model_name
	        # Defined up front so the attribute exists even when loading fails.
	        self.synthesizer = None

	        try:
	            # NOTE: this installs a process-wide "ignore" filter; it is not
	            # scoped to this class.
	            warnings.filterwarnings("ignore")

	            # Keep downloaded model files under the system temp directory.
	            cache_dir = os.path.join(tempfile.gettempdir(), "hf_tts_cache")
	            os.makedirs(cache_dir, exist_ok=True)

	            print(f"[HF TTS] 모델 로드 중: {model_name}, 캐시 디렉토리: {cache_dir}")

	            # Load the model on the first GPU when CUDA is available, else CPU.
	            start_time = time.time()
	            self.synthesizer = pipeline(
	                "text-to-speech",
	                model=model_name,
	                # cache_dir is a from_pretrained option, so it is routed
	                # through model_kwargs; passed as a top-level keyword it is
	                # forwarded to the pipeline object instead of the loader.
	                model_kwargs={"cache_dir": cache_dir},
	                device=0 if torch.cuda.is_available() else -1,
	            )
	            elapsed = time.time() - start_time

	            self.available = True
	            print(f"[HF TTS] 모델({model_name}) 로드 성공! ({elapsed:.1f}초)")
	        except Exception as e:
	            # Best-effort by design: report the failure and stay unavailable.
	            print(f"[HF TTS] 모델({model_name}) 로드 실패: {e}")
	            self.synthesizer = None
	            self.available = False

	    def generate_speech(self, text, output_path):
	        """Synthesize ``text`` and save it to ``output_path`` as a WAV file.

	        Empty or whitespace-only text is replaced with a placeholder sentence,
	        and text longer than 500 characters is cut to 497 characters plus
	        "...".

	        Args:
	            text: Text to convert to speech.
	            output_path: Path of the audio file to write.

	        Returns:
	            bool: True if a non-empty file was written; False when the model is
	            unavailable or any error occurs during synthesis or saving.
	        """
	        if not self.available:
	            return False

	        try:
	            # Validation 1: substitute a placeholder for empty text.
	            if not text or not text.strip():
	                print("[HF TTS] 경고: 빈 텍스트가 입력되었습니다")
	                text = "No text provided."

	            # Validation 2: truncate overly long text.
	            if len(text) > 500:
	                print(f"[HF TTS] 텍스트가 너무 깁니다 ({len(text)}자). 500자로 잘라냅니다.")
	                text = text[:497] + "..."

	            print(f"[HF TTS] 음성 생성 시작: '{text[:50]}...' (전체 {len(text)}자)")

	            # Run synthesis with warnings silenced for the duration of the call.
	            with warnings.catch_warnings():
	                warnings.simplefilter("ignore")
	                speech = self.synthesizer(text)

	            # The pipeline output carries raw waveform samples and their
	            # sampling rate, not an encoded file, so the samples must be
	            # wrapped in a WAV container to be playable.
	            file_path = output_path
	            self._write_wav(file_path, speech["audio"], speech["sampling_rate"])

	            # Confirm the file really exists and is non-empty.
	            if os.path.exists(file_path) and os.path.getsize(file_path) > 0:
	                print(f"[HF TTS] 음성 파일 저장 성공: {file_path}, 크기: {os.path.getsize(file_path)} 바이트")
	                return True
	            else:
	                print(f"[HF TTS] 오류: 파일이 저장되지 않았거나 비어 있습니다: {file_path}")
	                return False

	        except Exception as e:
	            print(f"[HF TTS] 음성 생성 중 오류 발생: {e}")
	            return False

	    @staticmethod
	    def _write_wav(file_path, audio, sampling_rate):
	        """Write waveform samples to ``file_path`` as 16-bit PCM WAV.

	        Args:
	            file_path: Destination path.
	            audio: Waveform samples (array-like or tensor), treated as floats
	                in the range [-1.0, 1.0]; values outside it are clipped.
	            sampling_rate: Samples per second.

	        Raises:
	            ValueError: If ``audio`` is empty or has more than two
	                non-singleton dimensions.
	        """
	        import wave  # stdlib; imported locally so this block is self-contained

	        waveform = torch.as_tensor(audio).detach().cpu().to(torch.float32)
	        if waveform.numel() == 0:
	            raise ValueError("empty audio")

	        # Drop singleton batch/channel axes such as (1, N).
	        waveform = waveform.squeeze()
	        if waveform.ndim == 0:
	            waveform = waveform.reshape(1)

	        if waveform.ndim == 1:
	            channels = 1
	        elif waveform.ndim == 2:
	            # assumes a (channels, samples) layout -- TODO confirm for
	            # multi-channel models. WAV frames interleave channels, hence the
	            # transpose to (samples, channels).
	            channels = waveform.shape[0]
	            waveform = waveform.t().contiguous()
	        else:
	            raise ValueError(f"unsupported audio shape: {tuple(waveform.shape)}")

	        # Scale to signed 16-bit; WAV sample data is little-endian.
	        pcm = (waveform.clamp(-1.0, 1.0) * 32767.0).round().to(torch.int16)
	        frames = pcm.numpy().astype("<i2").tobytes()

	        # Open the file ourselves so any path type accepted by open() works;
	        # the wave writer patches the header when its context exits.
	        with open(file_path, "wb") as raw, wave.open(raw, "wb") as wav_file:
	            wav_file.setnchannels(channels)
	            wav_file.setsampwidth(2)
	            wav_file.setframerate(int(sampling_rate))
	            wav_file.writeframes(frames)