Spaces:

jeongsoo
/

STT_TTS_chatbot

Paused

App Files Files Community

STT_TTS_chatbot / utils /hf_hub_tts.py

jeongsoo

Add application file

10c1a86 about 1 year ago

raw

history blame contribute delete

2.46 kB

	import os
	import torch
	import tempfile
	import time
	from huggingface_hub import hf_hub_download
	import torchaudio


	class HFHubTTS:
	    """Text-to-speech helper backed by a Hugging Face `transformers` pipeline.

	    The pipeline is created once in the constructor. Failures while loading
	    the model or generating audio are printed and reported through
	    `available` / a `False` return value instead of being raised, so the
	    class can be used as an optional, best-effort TTS backend.
	    """

	    def __init__(self, model_id="facebook/mms-tts-eng"):
	        """Create the text-to-speech pipeline for `model_id`.

	        Args:
	            model_id: Hugging Face Hub model ID to load
	                (default: "facebook/mms-tts-eng").
	        """
	        self.available = False
	        self.model_id = model_id
	        # Defined up front so the attribute exists even when loading fails.
	        self.tts = None

	        try:
	            # Imported lazily so a missing/broken `transformers` install only
	            # disables this backend instead of breaking module import.
	            from transformers import pipeline

	            print(f"[HF Hub TTS] 모델 로드 중: {model_id}")
	            started = time.perf_counter()

	            self.tts = pipeline("text-to-speech", model=model_id)

	            elapsed = time.perf_counter() - started
	            self.available = True
	            print(f"[HF Hub TTS] 모델 '{model_id}' 로드 성공! ({elapsed:.1f}초)")
	        except Exception as e:
	            # Deliberate best-effort: report the problem and stay unavailable.
	            print(f"[HF Hub TTS] 모델 '{model_id}' 로드 실패: {e}")
	            self.available = False

	    @staticmethod
	    def _write_wav(output_path, audio, sampling_rate):
	        """Write a float waveform to `output_path` as a 16-bit PCM WAV file.

	        Args:
	            audio: Array-like of float samples. Samples are clipped to
	                [-1.0, 1.0] before conversion. A 2-D input is assumed to
	                carry channels on its smaller axis -- TODO confirm against
	                the models actually used.
	            sampling_rate: Sample rate in Hz stored in the WAV header.

	        Raises:
	            ValueError: If the waveform is empty or has more than two
	                dimensions after removing length-1 axes.
	        """
	        # Local imports: neither module is imported at the top of this file.
	        import wave

	        import numpy as np

	        samples = np.squeeze(np.asarray(audio, dtype=np.float32))
	        if samples.ndim == 0:
	            samples = samples.reshape(1)
	        if samples.size == 0:
	            raise ValueError("empty audio waveform")

	        if samples.ndim == 1:
	            channels = 1
	        elif samples.ndim == 2:
	            # WAV frames are interleaved, i.e. laid out as (samples, channels).
	            if samples.shape[0] < samples.shape[1]:
	                samples = samples.T
	            channels = samples.shape[1]
	        else:
	            raise ValueError(f"unsupported audio shape: {samples.shape}")

	        # NaN/inf would make the integer conversion undefined.
	        samples = np.nan_to_num(samples, nan=0.0, posinf=1.0, neginf=-1.0)
	        pcm = (np.clip(samples, -1.0, 1.0) * 32767.0).astype("<i2")

	        # Open the file ourselves so every path type accepted by `open()`
	        # keeps working; `wave` then writes the header and frames into it.
	        with open(output_path, "wb") as raw_file:
	            with wave.open(raw_file, "wb") as wav_file:
	                wav_file.setnchannels(channels)
	                wav_file.setsampwidth(2)  # 16-bit samples
	                wav_file.setframerate(int(sampling_rate))
	                wav_file.writeframes(pcm.tobytes())

	    def generate_speech(self, text, output_path):
	        """Synthesize `text` and save it to `output_path` as a WAV file.

	        Args:
	            text: Text to convert to speech.
	            output_path: Destination file path.

	        Returns:
	            bool: True if a non-empty audio file was written; False if the
	            model is unavailable, the text is blank, or any error occurred.
	        """
	        if not self.available:
	            return False

	        try:
	            # Validation stays inside the try so a non-string `text` is
	            # reported as a failure rather than raising to the caller.
	            if not text or not text.strip():
	                print("[HF Hub TTS] 빈 텍스트가 입력되었습니다.")
	                return False

	            preview = text[:50] + ("..." if len(text) > 50 else "")
	            print(f"[HF Hub TTS] 음성 생성 시작: '{preview}'")
	            started = time.perf_counter()

	            speech = self.tts(text)

	            # The pipeline result carries the waveform and its sample rate;
	            # dumping the raw array bytes would not produce a playable file.
	            self._write_wav(output_path, speech["audio"], speech["sampling_rate"])

	            elapsed = time.perf_counter() - started

	            if os.path.exists(output_path) and os.path.getsize(output_path) > 0:
	                print(f"[HF Hub TTS] 음성 생성 성공: {output_path} ({elapsed:.1f}초)")
	                return True

	            print("[HF Hub TTS] 음성 파일이 생성되지 않았습니다.")
	            return False

	        except Exception as e:
	            # Deliberate best-effort: callers only see a boolean result.
	            print(f"[HF Hub TTS] 음성 생성 중 오류 발생: {e}")
	            return False