Spaces:

mr-don88
/

ELEVENLAB

Paused

App Files Files Community

ELEVENLAB / app.py

mr-don88

Update app.py

baa7af5 verified 7 months ago

raw

history blame

108 kB

	import spaces
	from vansarah import KModel, KPipeline
	import gradio as gr
	import torch
	import numpy as np
	import wave
	import io
	import time
	import re
	import json
	from typing import List, Tuple, Optional, Dict
	from pydub import AudioSegment
	from pydub.effects import normalize, compress_dynamic_range, low_pass_filter, high_pass_filter
	import os
	import random
	from phonemizer import backend
	from datetime import timedelta

	# Tokenizer class with enhanced text processing
	class Tokenizer:
	def __init__(self):
	    """Set up the vocabulary, text-normalization tables and phonemizers.

	    The lookup tables come from the class's own builder helpers. One
	    espeak phonemizer backend is created for each supported English
	    variant ('en-us' and 'en-gb'), with punctuation preservation and
	    stress output enabled.
	    """
	    # Symbol -> integer index table.
	    self.VOCAB = self._get_vocab()

	    # Text-normalization resources, built in the same order as before.
	    self.special_cases = self._build_special_cases()
	    self.special_regex = self._build_special_regex()
	    self.abbreviation_patterns = self._build_abbreviation_patterns()

	    # One espeak backend per English variant, keyed by its language code.
	    espeak_options = {"preserve_punctuation": True, "with_stress": True}
	    self.phonemizers = {
	        lang_code: backend.EspeakBackend(language=lang_code, **espeak_options)
	        for lang_code in ("en-us", "en-gb")
	    }

	@staticmethod
	def _get_vocab():
	_pad = "$"
	_punctuation = ';:,.!?¡¿—…"«»“” '
	_letters = 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz'
	_letters_ipa = "ɑɐɒæɓʙβɔɕçɗɖðʤəɘɚɛɜɝɞɟʄɡɠɢʛɦɧħɥʜɨɪʝɭɬɫɮʟɱɯɰŋɳɲɴøɵɸθœɶʘɹɺɾɻʀʁɽʂʃʈʧʉʊʋⱱʌɣɤʍχʎʏʑʐʒʔʡʕʢǀǁǂǃˈˌːˑʼʴʰʱʲʷˠˤ˞↓↑→↗↘'̩'ᵻ"
	symbols = [_pad] + list(_punctuation) + list(_letters) + list(_letters_ipa)
	return {symbol: index for index, symbol in enumerate(symbols)}


	def _build_special_cases(self) -> Dict[str, str]:
	"""Từ điển các từ đặc biệt cần chuẩn hóa cách đọc"""
	cases = {
	# 1. Đại từ nhân xưng
	"I": "I", "me": "me", "my": "my", "mine": "mine", "myself": "myself",
	"you": "you", "your": "your", "yours": "yours", "yourself": "yourself",
	"he": "he", "him": "him", "his": "his", "himself": "himself",
	"she": "she", "her": "her", "hers": "hers", "herself": "herself",
	"we": "we", "us": "us", "our": "our", "ours": "ours", "ourselves": "ourselves",
	"they": "they", "them": "them", "their": "their", "theirs": "theirs",
	"it": "it", "its": "its", "itself": "itself",
	"yourselves": "yourselves", "oneself": "oneself",

	# 2. Động từ to be/trợ động từ
	"is": "is", "are": "are", "am": "am", "was": "was", "were": "were",
	"be": "be", "been": "been", "being": "being", "have": "have",
	"has": "has", "had": "had", "do": "do", "does": "does", "did": "did",
	"can": "can", "could": "could", "will": "will", "would": "would",
	"shall": "shall", "should": "should", "may": "may", "might": "might",
	"must": "must", "ought": "ought", "dare": "dare", "need": "need",
	"used": "used", "going": "going",

	# 3. Giới từ/Liên từ
	"and": "AND", "or": "or", "but": "but", "for": "for", "nor": "nor",
	"yet": "yet", "so": "so", "the": "the", "a": "a", "an": "an",
	"this": "this", "that": "that", "these": "these", "those": "those",
	"in": "in", "on": "on", "at": "at", "by": "by", "with": "with",
	"without": "without", "to": "to", "from": "from", "of": "of",
	"about": "about", "as": "as", "like": "like", "up": "up", "down": "down",
	"over": "over", "under": "under", "between": "between", "among": "among",
	"through": "through", "during": "during", "before": "before",
	"after": "after", "above": "above", "below": "below", "near": "near",
	"since": "since", "until": "until", "while": "while", "although": "although",
	"though": "though", "whether": "whether", "unless": "unless",
	"because": "because", "if": "if", "than": "than", "once": "once",

	# 4. Trạng từ/Phó từ
	"not": "not", "also": "also", "very": "very", "too": "too",
	"just": "just", "only": "only", "even": "even", "now": "now",
	"then": "then", "here": "here", "there": "there", "always": "always",
	"never": "never", "sometimes": "sometimes", "usually": "usually",
	"often": ", often", "rarely": "rarely", "seldom": "seldom",
	"already": "already", "yet": "yet", "still": "still", "almost": "almost",
	"enough": "enough", "quite": "quite", "rather": "rather",
	"maybe": "maybe", "perhaps": "perhaps", "probably": "probably",
	"absolutely": "absolutely", "completely": "completely", "totally": "totally",
	"utterly": "utterly", "literally": "literally", "basically": "basically",
	"actually": "actually", "certainly": "certainly", "clearly": "clearly",
	"obviously": "obviously", "possibly": "possibly", "surely": "surely",

	# 5. Từ để hỏi
	"what": "what", "when": "when", "where": "where", "why": "why",
	"how": "how", "who": "who", "whom": "whom", "whose": "whose",
	"which": "which", "whether": "whether",

	# 6. Từ cảm thán
	"oh": "oh", "wow": "wow", "ouch": "ouch", "oops": "oops",
	"hey": "hey", "hi": "hi", "hello": "hello", "goodbye": "goodbye",
	"please": "please", "thanks": "thanks", "thank you": "thank you",
	"sorry": "sorry", "yes": "yes", "no": "no", "okay": "okay",

	# 9. Từ thông dụng khác
	"course": ", course", "keep": "KEEP", "Welcome": "WELCOM",
	"really": "REALLY", "ok": "okay", "okay": "okay", "good": "good",
	"bad": "bad", "new": "new", "old": "old", "first": "first",
	"last": "last", "great": "great", "small": "small", "big": "big",
	"high": "high", "low": "low", "next": "next", "same": "same",
	"different": "different", "another": "another", "each": "each",
	"every": "every", "few": "few", "many": "many", "most": "most",
	"much": "much", "some": "some", "such": "such", "all": "all",
	"any": "any", "both": "both", "either": "either", "neither": "neither",
	"none": "none", "own": "own", "other": "other", "rather": "rather",
	"several": "several", "half": "half", "whole": "whole",
	"true": "true", "false": "false", "right": "right", "wrong": "wrong",
	"important": "important", "interesting": "interesting",
	"necessary": "necessary", "possible": "possible",
	"beautiful": "beautiful", "wonderful": "wonderful",
	"excellent": "excellent", "perfect": "perfect",
	"awesome": "awesome", "terrible": "terrible",
	"horrible": "horrible", "delicious": "delicious",
	"important": "important", "special": "special",
	"amazing": "amazing", "incredible": "incredible",
	"unbelievable": "unbelievable", "serious": "serious",
	"funny": "funny", "happy": "happy", "sad": "sad",
	"angry": "angry", "surprised": "surprised",
	"excited": "excited", "bored": "bored", "tired": "tired",
	"hungry": "hungry", "thirsty": "thirsty", "ready": "ready",
	"busy": "busy", "free": "free", "open": "open", "closed": "closed",
	"easy": "easy", "difficult": "difficult", "simple": "simple",
	"complex": "complex", "clean": "clean", "dirty": "dirty",
	"early": "early", "late": "late", "fast": "fast", "slow": "slow",
	"hot": "hot", "cold": "cold", "warm": "warm", "cool": "cool",
	"light": "light", "dark": "dark", "noisy": "noisy", "quiet": "quiet",
	"expensive": "expensive", "cheap": "cheap", "rich": "rich",
	"poor": "poor", "strong": "strong", "weak": "weak", "healthy": "healthy",
	"sick": "sick", "dead": "dead", "alive": "alive", "real": "real",
	"fake": "fake", "modern": "modern", "ancient": "ancient",
	"young": "young", "future": "future", "past": "past",
	"present": "present", "current": "current", "recent": "recent",
	"immediate": "immediate", "sudden": "sudden", "final": "final",
	"initial": "initial", "primary": "primary", "secondary": "secondary",
	"main": "main", "major": "major", "minor": "minor",
	"average": "average", "normal": "normal", "usual": "usual",
	"unusual": "unusual", "common": "common", "rare": "rare",
	"unique": "unique", "strange": "strange", "odd": "odd",
	"typical": "typical", "traditional": "traditional",
	"original": "original", "basic": "basic", "advanced": "advanced",
	"professional": "professional", "personal": "personal",
	"private": "private", "public": "public", "national": "national",
	"international": "international", "local": "local",
	"global": "global", "general": "general", "specific": "specific",
	"particular": "particular", "special": "special",
	"especial": "especial", "various": "various", "several": "several",
	"numerous": "numerous", "countless": "countless", "endless": "endless",
	"limited": "limited", "unlimited": "unlimited", "enough": "enough",
	"plenty": "plenty", "extra": "extra", "additional": "additional",
	"further": "further", "following": "following", "previous": "previous",
	"former": "former", "latter": "latter", "upper": "upper",
	"lower": "lower", "inner": "inner", "outer": "outer",
	"external": "external", "internal": "internal", "central": "central",
	"middle": "middle", "intermediate": "intermediate", "direct": "direct",
	"indirect": "indirect", "positive": "positive", "negative": "negative",
	"neutral": "neutral", "active": "active", "passive": "passive",
	"constant": "constant", "variable": "variable", "regular": "regular",
	"irregular": "irregular", "proper": "proper", "improper": "improper",
	"correct": "correct", "incorrect": "incorrect", "accurate": "accurate",
	"inaccurate": "inaccurate", "exact": "exact", "approximate": "approximate",
	"precise": "precise", "vague": "vague", "clear": "clear",
	"unclear": "unclear", "obvious": "obvious", "apparent": "apparent",
	"transparent": "transparent", "opaque": "opaque", "visible": "visible",
	"invisible": "invisible", "audible": "audible", "inaudible": "inaudible",
	"tangible": "tangible", "intangible": "intangible", "physical": "physical",
	"mental": "mental", "emotional": "emotional", "spiritual": "spiritual",
	"intellectual": "intellectual", "psychological": "psychological",
	"social": "social", "cultural": "cultural", "political": "political",
	"economic": "economic", "financial": "financial", "commercial": "commercial",
	"industrial": "industrial", "technological": "technological",
	"scientific": "scientific", "medical": "medical", "legal": "legal",
	"official": "official", "unofficial": "unofficial", "formal": "formal",
	"informal": "informal", "casual": "casual", "natural": "natural",
	"artificial": "artificial", "synthetic": "synthetic", "organic": "organic",
	"inorganic": "inorganic", "genuine": "genuine", "fake": "fake",
	"authentic": "authentic", "counterfeit": "counterfeit", "valid": "valid",
	"invalid": "invalid", "void": "void", "null": "null", "empty": "empty",
	"full": "full", "complete": "complete", "incomplete": "incomplete",
	"partial": "partial", "total": "total", "entire": "entire",
	"whole": "whole", "half": "half", "quarter": "quarter",
	"third": "third", "fourth": "fourth", "fifth": "fifth",
	"sixth": "sixth", "seventh": "seventh", "eighth": "eighth",
	"ninth": "ninth", "tenth": "tenth", "hundredth": "hundredth",
	"thousandth": "thousandth", "millionth": "millionth",
	"billionth": "billionth", "trillionth": "trillionth",
	"single": "single", "double": "double", "triple": "triple",
	"quadruple": "quadruple", "quintuple": "quintuple",
	"sextuple": "sextuple", "septuple": "septuple", "octuple": "octuple",
	"nonuple": "nonuple", "decuple": "decuple", "multiple": "multiple",
	"manifold": "manifold", "various": "various", "diverse": "diverse",
	"different": "different", "similar": "similar", "alike": "alike",
	"identical": "identical", "same": "same", "equal": "equal",
	"equivalent": "equivalent", "parallel": "parallel", "perpendicular": "perpendicular",
	"horizontal": "horizontal", "vertical": "vertical", "diagonal": "diagonal",
	"straight": "straight", "curved": "curved", "circular": "circular",
	"spherical": "spherical", "square": "square", "rectangular": "rectangular",
	"triangular": "triangular", "round": "round", "oval": "oval",
	"flat": "flat", "smooth": "smooth", "rough": "rough", "soft": "soft",
	"hard": "hard", "flexible": "flexible", "rigid": "rigid",
	"elastic": "elastic", "plastic": "plastic", "liquid": "liquid",
	"solid": "solid", "gaseous": "gaseous", "fluid": "fluid",
	"viscous": "viscous", "dense": "dense", "thin": "thin",
	"thick": "thick", "shallow": "shallow", "deep": "deep",
	"narrow": "narrow", "wide": "wide", "broad": "broad",
	"long": "long", "short": "short", "tall": "tall", "huge": "huge",
	"tiny": "tiny", "giant": "giant", "gigantic": "gigantic",
	"enormous": "enormous", "immense": "immense", "vast": "vast",
	"colossal": "colossal", "massive": "massive", "monumental": "monumental",
	"tremendous": "tremendous", "stupendous": "stupendous",
	"prodigious": "prodigious", "marvelous": "marvelous",
	"wonderful": "wonderful", "fantastic": "fantastic",
	"fabulous": "fabulous", "terrific": "terrific", "superb": "superb",
	"splendid": "splendid", "magnificent": "magnificent",
	"glorious": "glorious", "divine": "divine", "heavenly": "heavenly",
	"celestial": "celestial", "terrestrial": "terrestrial",
	"earthly": "earthly", "mundane": "mundane", "worldly": "worldly",
	"human": "human", "humane": "humane", "animal": "animal",
	"vegetable": "vegetable", "mineral": "mineral", "metallic": "metallic",
	"wooden": "wooden", "glass": "glass", "plastic": "plastic",
	"rubber": "rubber", "cloth": "cloth", "paper": "paper",
	"leather": "leather", "fur": "fur", "wool": "wool", "silk": "silk",
	"cotton": "cotton", "linen": "linen", "nylon": "nylon",
	"polyester": "polyester", "rayon": "rayon", "acrylic": "acrylic",
	"spandex": "spandex", "denim": "denim", "velvet": "velvet",
	"satin": "satin", "lace": "lace", "tulle": "tulle",
	"chiffon": "chiffon", "taffeta": "taffeta", "organza": "organza",
	"georgette": "georgette", "crepe": "crepe", "jersey": "jersey",
	"tweed": "tweed", "corduroy": "corduroy", "flannel": "flannel",
	"cashmere": "cashmere", "angora": "angora", "mohair": "mohair",
	"alpaca": "alpaca", "llama": "llama", "camel": "camel",
	"vicuna": "vicuna", "guanaco": "guanaco", "bison": "bison",
	"buffalo": "buffalo", "yak": "yak", "muskox": "muskox",
	"qiviut": "qiviut", "chiengora": "chiengora", "dog": "dog",
	"cat": "cat", "horse": "horse", "cow": "cow", "pig": "pig",
	"sheep": "sheep", "goat": "goat", "chicken": "chicken",
	"duck": "duck", "goose": "goose", "turkey": "turkey",
	"rabbit": "rabbit", "deer": "deer", "moose": "moose",
	"elk": "elk", "caribou": "caribou", "reindeer": "reindeer",
	"antelope": "antelope", "gazelle": "gazelle", "impala": "impala",
	"springbok": "springbok", "oryx": "oryx", "addax": "addax",
	"kudu": "kudu", "eland": "eland", "nyala": "nyala", "bongo": "bongo",
	"sable": "sable", "roan": "roan", "waterbuck": "waterbuck",
	"lechwe": "lechwe", "puku": "puku", "sitatunga": "sitatunga",
	"bushbuck": "bushbuck", "duiker": "duiker", "klipspringer": "klipspringer",
	"steenbok": "steenbok", "grysbok": "grysbok", "dikdik": "dikdik",
	"sun": "sun", "moon": "moon", "star": "star", "planet": "planet",
	"comet": "comet", "asteroid": "asteroid", "meteor": "meteor",
	"meteorite": "meteorite", "meteoroid": "meteoroid", "galaxy": "galaxy",
	"universe": "universe", "cosmos": "cosmos", "space": "space",
	"time": "time", "light": "light", "dark": "dark", "energy": "energy",
	"matter": "matter", "atom": "atom", "molecule": "molecule",
	"element": "element", "compound": "compound", "mixture": "mixture",
	"solution": "solution", "suspension": "suspension",
	"colloid": "colloid", "emulsion": "emulsion", "foam": "foam",
	"aerosol": "aerosol", "gel": "gel", "sol": "sol", "solid": "solid",
	"liquid": "liquid", "gas": "gas", "plasma": "plasma",
	"crystal": "crystal", "powder": "powder", "granule": "granule",
	"particle": "particle", "grain": "grain", "pebble": "pebble",
	"stone": "stone", "rock": "rock", "boulder": "boulder",
	"sand": "sand", "soil": "soil", "clay": "clay", "mud": "mud",
	"dust": "dust", "dirt": "dirt", "earth": "earth", "ground": "ground",
	"land": "land", "terrain": "terrain", "topography": "topography",
	"geography": "geography", "geology": "geology", "ocean": "ocean",
	"sea": "sea", "lake": "lake", "river": "river", "stream": "stream",
	"creek": "creek", "brook": "brook", "pond": "pond", "pool": "pool",
	"puddle": "puddle", "swamp": "swamp", "marsh": "marsh",
	"bog": "bog", "fen": "fen", "wetland": "wetland", "delta": "delta",
	"estuary": "estuary", "lagoon": "lagoon", "fjord": "fjord",
	"bay": "bay", "gulf": "gulf", "harbor": "harbor", "port": "port",
	"dock": "dock", "pier": "pier", "wharf": "wharf", "quay": "quay",
	"marina": "marina", "canal": "canal", "channel": "channel",
	"strait": "strait", "sound": "sound", "inlet": "inlet",
	"cove": "cove", "beach": "beach", "shore": "shore",
	"coast": "coast", "bank": "bank", "cliff": "cliff",
	"bluff": "bluff", "dune": "dune", "hill": "hill",
	"mountain": "mountain", "valley": "valley", "canyon": "canyon",
	"gorge": "gorge", "ravine": "ravine", "glen": "glen",
	"dale": "dale", "meadow": "meadow", "field": "field",
	"pasture": "pasture", "prairie": "prairie", "savanna": "savanna",
	"steppe": "steppe", "tundra": "tundra", "desert": "desert",
	"jungle": "jungle", "forest": "forest", "woodland": "woodland",
	"grove": "grove", "orchard": "orchard", "vineyard": "vineyard",
	"park": "park", "garden": "garden", "lawn": "lawn",
	"yard": "yard", "courtyard": "courtyard", "plaza": "plaza",
	"square": "square", "circle": "circle", "triangle": "triangle",
	"rectangle": "rectangle", "pentagon": "pentagon", "hexagon": "hexagon",
	"octagon": "octagon", "oval": "oval", "ellipse": "ellipse",
	"cube": "cube", "sphere": "sphere", "cylinder": "cylinder",
	"cone": "cone", "pyramid": "pyramid", "prism": "prism",
	"tetrahedron": "tetrahedron", "dodecahedron": "dodecahedron",
	"icosahedron": "icosahedron", "torus": "torus", "helix": "helix",
	"spiral": "spiral", "fractal": "fractal", "dimension": "dimension",
	"point": "point", "line": "line", "plane": "plane",
	"surface": "surface", "volume": "volume", "angle": "angle",
	"degree": "degree", "radian": "radian", "gradian": "gradian",
	"minute": "minute", "second": "second", "hour": "hour",
	"day": "day", "week": "week", "month": "month", "year": "year",
	"decade": "decade", "century": "century", "millennium": "millennium",
	"eon": "eon", "era": "era", "epoch": "epoch", "age": "age",
	"generation": "generation", "lifetime": "lifetime",
	"moment": "moment", "instant": "instant", "period": "period",
	"duration": "duration", "interval": "interval", "span": "span",
	"term": "term", "session": "session", "meeting": "meeting",
	"conference": "conference", "convention": "convention",
	"symposium": "symposium", "seminar": "seminar", "workshop": "workshop",
	"lecture": "lecture", "presentation": "presentation",
	"demonstration": "demonstration", "exhibition": "exhibition",
	"fair": "fair", "show": "show", "performance": "performance",
	"concert": "concert", "recital": "recital", "play": "play",
	"drama": "drama", "opera": "opera", "ballet": "ballet",
	"musical": "musical", "movie": "movie", "film": "film",
	"cinema": "cinema", "theater": "theater", "television": "television",
	"radio": "radio", "broadcast": "broadcast", "podcast": "podcast",
	"webcast": "webcast", "stream": "stream", "download": "download",
	"upload": "upload", "file": "file", "document": "document",
	"record": "record", "archive": "archive", "database": "database",
	"library": "library", "catalog": "catalog", "index": "index",
	"directory": "directory", "folder": "folder", "album": "album",
	"collection": "collection", "set": "set", "series": "series",
	"sequence": "sequence", "array": "array", "matrix": "matrix",
	"grid": "grid", "table": "table", "chart": "chart",
	"graph": "graph", "diagram": "diagram", "map": "map",
	"plan": "plan", "scheme": "scheme", "blueprint": "blueprint",
	"design": "design", "model": "model", "prototype": "prototype",
	"template": "template", "pattern": "pattern", "sample": "sample",
	"example": "example", "instance": "instance", "case": "case",
	"item": "item", "unit": "unit", "piece": "piece", "part": "part",
	"section": "section", "segment": "segment", "portion": "portion",
	"fraction": "fraction", "percentage": "percentage", "ratio": "ratio",
	"proportion": "proportion", "rate": "rate", "speed": "speed",
	"velocity": "velocity", "acceleration": "acceleration",
	"momentum": "momentum", "force": "force", "pressure": "pressure",
	"stress": "stress", "strain": "strain", "tension": "tension",
	"compression": "compression", "shear": "shear", "torque": "torque",
	"energy": "energy", "work": "work", "power": "power",
	"efficiency": "efficiency", "capacity": "capacity",
	"potential": "potential", "kinetic": "kinetic", "thermal": "thermal",
	"electrical": "electrical", "magnetic": "magnetic",
	"nuclear": "nuclear", "chemical": "chemical", "atomic": "atomic",
	"molecular": "molecular", "quantum": "quantum", "relativistic": "relativistic",
	"gravitational": "gravitational", "electromagnetic": "electromagnetic",
	"weak": "weak", "strong": "strong", "fundamental": "fundamental",
	"basic": "basic", "advanced": "advanced", "complex": "complex",
	"simple": "simple", "difficult": "difficult", "easy": "easy",
	"hard": "hard", "soft": "soft", "rigid": "rigid", "flexible": "flexible",
	"elastic": "elastic", "plastic": "plastic", "ductile": "ductile",
	"malleable": "malleable", "brittle": "brittle", "tough": "tough",
	"hardy": "hardy", "resilient": "resilient", "fragile": "fragile",
	"delicate": "delicate", "sturdy": "sturdy", "robust": "robust",
	"durable": "durable", "stable": "stable", "unstable": "unstable",
	"volatile": "volatile", "constant": "constant", "variable": "variable",
	"random": "random", "chaotic": "chaotic", "ordered": "ordered",
	"disordered": "disordered", "organized": "organized",
	"disorganized": "disorganized", "systematic": "systematic",
	"methodical": "methodical", "logical": "logical", "illogical": "illogical",
	"rational": "rational", "irrational": "irrational", "reasonable": "reasonable",
	"unreasonable": "unreasonable", "sensible": "sensible", "nonsensical": "nonsensical",
	"absurd": "absurd", "ridiculous": "ridiculous", "ludicrous": "ludicrous",
	"preposterous": "preposterous", "outrageous": "outrageous", "scandalous": "scandalous",
	"shocking": "shocking", "astonishing": "astonishing", "amazing": "amazing",
	"astounding": "astounding", "staggering": "staggering", "stunning": "stunning",
	"breathtaking": "breathtaking", "mindblowing": "mindblowing", "jawdropping": "jawdropping",
	"eyeopening": "eyeopening", "earthshaking": "earthshaking", "groundbreaking": "groundbreaking",
	"revolutionary": "revolutionary", "innovative": "innovative", "original": "original",
	"creative": "creative", "imaginative": "imaginative", "inventive": "inventive",
	"resourceful": "resourceful", "ingenious": "ingenious", "clever": "clever",
	"smart": "smart", "intelligent": "intelligent", "brilliant": "brilliant",
	"genius": "genius", "gifted": "gifted", "talented": "talented",
	"skilled": "skilled", "adept": "adept", "proficient": "proficient",
	"competent": "competent", "capable": "capable", "able": "able",
	"qualified": "qualified", "experienced": "experienced", "practiced": "practiced",
	"seasoned": "seasoned", "veteran": "veteran", "expert": "expert",
	"master": "master", "professional": "professional", "specialist": "specialist",
	"authority": "authority", "scholar": "scholar", "academic": "academic",
	"scientist": "scientist", "researcher": "researcher", "investigator": "investigator",
	"analyst": "analyst", "theorist": "theorist", "philosopher": "philosopher",
	"thinker": "thinker", "intellectual": "intellectual", "sage": "sage",
	"wise": "wise", "knowledgeable": "knowledgeable", "learned": "learned",
	"educated": "educated", "literate": "literate", "illiterate": "illiterate",
	"ignorant": "ignorant", "uninformed": "uninformed", "naive": "naive",
	"innocent": "innocent", "simple": "simple", "unsophisticated": "unsophisticated",
	"gullible": "gullible", "credulous": "credulous", "trusting": "trusting",
	"skeptical": "skeptical", "doubtful": "doubtful", "suspicious": "suspicious",
	"cynical": "cynical", "pessimistic": "pessimistic", "optimistic": "optimistic",
	"hopeful": "hopeful", "confident": "confident", "certain": "certain",
	"sure": "sure", "positive": "positive", "negative": "negative",
	"neutral": "neutral", "indifferent": "indifferent", "apathetic": "apathetic",
	"unconcerned": "unconcerned", "detached": "detached", "disinterested": "disinterested",
	"objective": "objective", "subjective": "subjective", "biased": "biased",
	"prejudiced": "prejudiced", "partial": "partial", "impartial": "impartial",
	"fair": "fair", "just": "just", "unjust": "unjust", "righteous": "righteous",
	"virtuous": "virtuous", "moral": "moral", "ethical": "ethical",
	"principled": "principled", "honorable": "honorable", "noble": "noble",
	"upstanding": "upstanding", "respectable": "respectable", "decent": "decent",
	"good": "good", "evil": "evil", "wicked": "wicked", "sinful": "sinful",
	"immoral": "immoral", "unethical": "unethical", "corrupt": "corrupt",
	"dishonest": "dishonest", "fraudulent": "fraudulent", "deceitful": "deceitful",
	"lying": "lying", "false": "false", "untrue": "untrue", "truthful": "truthful",
	"honest": "honest", "sincere": "sincere", "genuine": "genuine",
	"authentic": "authentic", "real": "real", "fake": "fake",
	"counterfeit": "counterfeit", "forged": "forged", "sham": "sham",
	"bogus": "bogus", "phony": "phony", "artificial": "artificial",
	"synthetic": "synthetic", "manmade": "manmade", "natural": "natural",
	"organic": "organic", "pure": "pure", "impure": "impure",
	"contaminated": "contaminated", "polluted": "polluted", "toxic": "toxic",
	"poisonous": "poisonous", "hazardous": "hazardous", "dangerous": "dangerous",
	"risky": "risky", "perilous": "perilous", "precarious": "precarious",
	"uncertain": "uncertain", "unpredictable": "unpredictable", "volatile": "volatile",
	"unstable": "unstable", "insecure": "insecure", "safe": "safe",
	"secure": "secure", "protected": "protected", "guarded": "guarded",
	"defended": "defended", "shielded": "shielded", "sheltered": "sheltered",
	"immune": "immune", "resistant": "resistant", "vulnerable": "vulnerable",
	"susceptible": "susceptible", "exposed": "exposed", "open": "open",
	"closed": "closed", "shut": "shut", "locked": "locked",
	"unlocked": "unlocked", "sealed": "sealed", "unsealed": "unsealed",
	"tight": "tight", "loose": "loose", "firm": "firm",
	"stable": "stable", "steady": "steady", "unsteady": "unsteady",
	"shaky": "shaky", "wobbly": "wobbly", "rocky": "rocky",
	"balanced": "balanced", "unbalanced": "unbalanced", "level": "level",
	"even": "even", "uneven": "uneven", "flat": "flat",
	"smooth": "smooth", "rough": "rough", "bumpy": "bumpy",
	"lumpy": "lumpy", "jagged": "jagged", "pointed": "pointed",
	"sharp": "sharp", "blunt": "blunt", "dull": "dull",
	"rounded": "rounded", "curved": "curved", "straight": "straight",
	"bent": "bent", "twisted": "twisted", "coiled": "coiled",
	"spiral": "spiral", "helical": "helical", "circular": "circular",
	"round": "round", "oval": "oval", "elliptical": "elliptical",
	"spherical": "spherical", "globular": "globular", "cylindrical": "cylindrical",
	"conical": "conical", "pyramidal": "pyramidal", "cubical": "cubical",
	"rectangular": "rectangular", "triangular": "triangular", "square": "square",
	"pentagonal": "pentagonal", "hexagonal": "hexagonal", "octagonal": "octagonal",
	"polygonal": "polygonal", "symmetrical": "symmetrical", "asymmetrical": "asymmetrical",
	"regular": "regular", "irregular": "irregular", "uniform": "uniform",
	"nonuniform": "nonuniform", "consistent": "consistent", "inconsistent": "inconsistent",
	"coherent": "coherent", "incoherent": "incoherent", "logical": "logical",
	"illogical": "illogical", "rational": "rational", "irrational": "irrational",
	"reasonable": "reasonable", "unreasonable": "unreasonable", "sensible": "sensible",
	"nonsensical": "nonsensical", "absurd": "absurd", "ridiculous": "ridiculous",
	"ludicrous": "ludicrous", "preposterous": "preposterous", "outrageous": "outrageous",
	"scandalous": "scandalous", "shocking": "shocking", "astonishing": "astonishing",
	"amazing": "amazing", "astounding": "astounding", "staggering": "staggering",
	"stunning": "stunning", "breathtaking": "breathtaking", "mindblowing": "mindblowing",
	"jawdropping": "jawdropping", "eyeopening": "eyeopening", "earthshaking": "earthshaking",
	"groundbreaking": "groundbreaking", "revolutionary": "revolutionary", "innovative": "innovative",
	"original": "original", "creative": "creative", "imaginative": "imaginative",
	"inventive": "inventive", "resourceful": "resourceful", "ingenious": "ingenious",
	"clever": "clever", "smart": "smart", "intelligent": "intelligent",
	"brilliant": "brilliant", "genius": "genius", "gifted": "gifted",
	"talented": "talented", "skilled": "skilled", "adept": "adept",
	"proficient": "proficient", "competent": "competent", "capable": "capable",
	"able": "able", "qualified": "qualified", "experienced": "experienced",
	"practiced": "practiced", "seasoned": "seasoned", "veteran": "veteran",
	"expert": "expert", "master": "master", "professional": "professional",
	"specialist": "specialist", "authority": "authority", "scholar": "scholar",
	"academic": "academic", "scientist": "scientist", "researcher": "researcher",
	"investigator": "investigator", "analyst": "analyst", "theorist": "theorist",
	"philosopher": "philosopher", "thinker": "thinker", "intellectual": "intellectual",
	"sage": "sage", "wise": "wise", "knowledgeable": "knowledgeable",
	"learned": "learned", "educated": "educated", "literate": "literate",
	"illiterate": "illiterate", "ignorant": "ignorant", "uninformed": "uninformed",
	"naive": "naive", "innocent": "innocent", "simple": "simple",
	"unsophisticated": "unsophisticated", "gullible": "gullible", "credulous": "credulous",
	"trusting": "trusting", "skeptical": "skeptical", "doubtful": "doubtful",
	"suspicious": "suspicious", "cynical": "cynical", "pessimistic": "pessimistic",
	"optimistic": "optimistic", "hopeful": "hopeful", "confident": "confident",
	"certain": "certain", "sure": "sure", "positive": "positive",
	"negative": "negative", "neutral": "neutral", "indifferent": "indifferent",
	"apathetic": "apathetic", "unconcerned": "unconcerned", "detached": "detached",
	"disinterested": "disinterested", "objective": "objective", "subjective": "subjective",
	"biased": "biased", "prejudiced": "prejudiced", "partial": "partial",
	"impartial": "impartial", "fair": "fair", "just": "just",
	"unjust": "unjust", "righteous": "righteous", "virtuous": "virtuous",
	"moral": "moral", "ethical": "ethical", "principled": "principled",
	"honorable": "honorable", "noble": "noble", "upstanding": "upstanding",
	"respectable": "respectable", "decent": "decent", "good": "good",
	"evil": "evil", "wicked": "wicked", "sinful": "sinful",
	"immoral": "immoral", "unethical": "unethical", "corrupt": "corrupt",
	"dishonest": "dishonest", "fraudulent": "fraudulent", "deceitful": "deceitful",
	"lying": "lying", "false": "false", "untrue": "untrue",
	"truthful": "truthful", "honest": "honest", "sincere": "sincere",
	"genuine": "genuine", "authentic": "authentic", "real": "real",
	"fake": "fake", "counterfeit": "counterfeit", "forged": "forged",
	"sham": "sham", "bogus": "bogus", "phony": "phony",
	"artificial": "artificial", "synthetic": "synthetic", "manmade": "manmade",
	"natural": "natural", "organic": "organic", "pure": "pure",
	"impure": "impure", "contaminated": "contaminated", "polluted": "polluted",
	"toxic": "toxic", "poisonous": "poisonous", "hazardous": "hazardous",
	"dangerous": "dangerous", "risky": "risky", "perilous": "perilous",
	"precarious": "precarious", "uncertain": "uncertain", "unpredictable": "unpredictable",
	"volatile": "volatile", "unstable": "unstable", "insecure": "insecure",
	"safe": "safe", "secure": "secure", "protected": "protected",
	"guarded": "guarded", "defended": "defended", "shielded": "shielded",
	"sheltered": "sheltered", "immune": "immune", "resistant": "resistant",
	"vulnerable": "vulnerable", "susceptible": "susceptible", "exposed": "exposed",
	"open": "open", "closed": "closed", "shut": "shut",
	"locked": "locked", "unlocked": "unlocked", "sealed": "sealed",
	"unsealed": "unsealed", "tight": "tight", "loose": "loose",
	"firm": "firm", "stable": "stable", "steady": "steady",
	"unsteady": "unsteady", "shaky": "shaky", "wobbly": "wobbly",
	"rocky": "rocky", "balanced": "balanced", "unbalanced": "unbalanced",
	"level": "level", "even": "even", "uneven": "uneven",
	"flat": "flat", "smooth": "smooth", "rough": "rough",
	"bumpy": "bumpy", "lumpy": "lumpy", "jagged": "jagged",
	"pointed": "pointed", "sharp": "sharp", "blunt": "blunt",
	"dull": "dull", "rounded": "rounded", "curved": "curved",
	"straight": "straight", "bent": "bent", "twisted": "twisted",
	"coiled": "coiled", "spiral": "spiral", "helical": "helical",
	"circular": "circular", "round": "round", "oval": "oval",
	"elliptical": "elliptical", "spherical": "spherical", "globular": "globular",
	"cylindrical": "cylindrical", "conical": "conical", "pyramidal": "pyramidal",
	"cubical": "cubical", "rectangular": "rectangular", "triangular": "triangular",
	"square": "square", "pentagonal": "pentagonal", "hexagonal": "hexagonal",
	"octagonal": "octagonal", "polygonal": "polygonal", "symmetrical": "symmetrical",
	"asymmetrical": "asymmetrical", "regular": "regular", "irregular": "irregular",
	"uniform": "uniform", "nonuniform": "nonuniform", "consistent": "consistent",
	"inconsistent": "inconsistent", "coherent": "coherent", "incoherent": "incoherent",
	"logical": "logical", "illogical": "illogical", "rational": "rational",
	"irrational": "irrational", "reasonable": "reasonable", "unreasonable": "unreasonable",
	"sensible": "sensible", "nonsensical": "nonsensical", "absurd": "absurd",
	"ridiculous": "ridiculous", "ludicrous": "ludicrous", "preposterous": "preposterous",
	"outrageous": "outrageous", "scandalous": "scandalous", "shocking": "shocking",
	"astonishing": "astonishing", "amazing": "amazing", "astounding": "astounding",
	"staggering": "staggering", "stunning": "stunning", "breathtaking": "breathtaking",
	"mindblowing": "mindblowing", "jawdropping": "jawdropping", "eyeopening": "eyeopening",
	"earthshaking": "earthshaking", "groundbreaking": "groundbreaking", "revolutionary": "revolutionary",
	"innovative": "innovative", "original": "original", "creative": "creative",
	"imaginative": "imaginative", "inventive": "inventive", "resourceful": "resourceful",
	"ingenious": "ingenious", "clever": "clever", "smart": "smart",
	"intelligent": "intelligent", "brilliant": "brilliant", "genius": "genius",
	"gifted": "gifted", "talented": "talented", "skilled": "skilled",
	"adept": "adept", "proficient": "proficient", "competent": "competent",
	"capable": "capable", "able": "able", "qualified": "qualified",
	"experienced": "experienced", "practiced": "practiced", "seasoned": "seasoned",
	"veteran": "veteran", "expert": "expert", "master": "master",
	"professional": "professional", "specialist": "specialist", "authority": "authority",
	"scholar": "scholar", "academic": "academic", "scientist": "scientist",
	"researcher": "researcher", "investigator": "investigator", "analyst": "analyst",
	"theorist": "theorist", "philosopher": "philosopher", "thinker": "thinker",
	"intellectual": "intellectual", "sage": "sage", "wise": "wise",
	"knowledgeable": "knowledgeable", "learned": "learned", "educated": "educated",
	"literate": "literate", "illiterate": "illiterate", "ignorant": "ignorant",
	"uninformed": "uninformed", "naive": "naive", "innocent": "innocent",
	"simple": "simple", "unsophisticated": "unsophisticated", "gullible": "gullible",
	"credulous": "credulous", "trusting": "trusting", "skeptical": "skeptical",
	"doubtful": "doubtful", "suspicious": "suspicious", "cynical": "cynical",
	"pessimistic": "pessimistic", "optimistic": "optimistic", "hopeful": "hopeful",
	"confident": "confident", "certain": "certain", "sure": "sure",
	"positive": "positive", "negative": "negative", "neutral": "neutral",
	"indifferent": "indifferent", "apathetic": "apathetic", "unconcerned": "unconcerned",
	"detached": "detached", "disinterested": "disinterested", "objective": "objective",
	"subjective": "subjective", "biased": "biased", "prejudiced": "prejudiced",
	"partial": "partial", "impartial": "impartial", "fair": "fair",
	"just": "just", "unjust": "unjust", "righteous": "righteous",
	"virtuous": "virtuous", "moral": "moral", "ethical": "ethical",
	"principled": "principled", "honorable": "honorable", "noble": "noble",
	"upstanding": "upstanding", "respectable": "respectable", "decent": "decent",
	"good": "good", "evil": "evil", "wicked": "wicked",
	"sinful": "sinful", "immoral": "immoral", "unethical": "unethical",
	"corrupt": "corrupt", "dishonest": "dishonest", "fraudulent": "fraudulent",
	"deceitful": "deceitful", "lying": "lying", "false": "false",
	"untrue": "untrue", "truthful": "truthful", "honest": "honest",
	"sincere": "sincere", "genuine": "genuine", "authentic": "authentic",
	"real": "real", "fake": "fake", "counterfeit": "counterfeit",
	"forged": "forged", "sham": "sham", "bogus": "bogus",
	"phony": "phony", "artificial": "artificial", "synthetic": "synthetic",
	"manmade": "manmade", "natural": "natural", "organic": "organic",
	"pure": "pure", "impure": "impure", "contaminated": "contaminated",
	"polluted": "polluted", "toxic": "toxic", "poisonous": "poisonous",
	"hazardous": "hazardous", "dangerous": "dangerous", "risky": "risky",
	"perilous": "perilous", "precarious": "precarious", "uncertain": "uncertain",
	"unpredictable": "unpredictable", "volatile": "volatile", "unstable": "unstable",
	"insecure": "insecure", "safe": "safe", "secure": "secure",
	"protected": "protected", "guarded": "guarded", "defended": "defended",
	"shielded": "shielded", "sheltered": "sheltered", "immune": "immune",
	"resistant": "resistant", "vulnerable": "vulnerable", "susceptible": "susceptible",
	"exposed": "exposed", "open": "open", "closed": "closed",
	"shut": "shut", "locked": "locked", "unlocked": "unlocked",
	"sealed": "sealed", "unsealed": "unsealed", "tight": "tight",
	"loose": "loose", "firm": "firm", "stable": "stable",
	"steady": "steady", "unsteady": "unsteady", "shaky": "shaky",
	"wobbly": "wobbly", "rocky": "rocky", "balanced": "balanced",
	"unbalanced": "unbalanced", "level": "level", "even": "even",
	"uneven": "uneven", "flat": "flat", "smooth": "smooth",
	"rough": "rough", "bumpy": "bumpy", "lumpy": "lumpy",
	"jagged": "jagged", "pointed": "pointed", "sharp": "sharp",
	"blunt": "blunt", "dull": "dull", "rounded": "rounded",
	"curved": "curved", "straight": "straight", "bent": "bent",
	"twisted": "twisted", "coiled": "coiled", "spiral": "spiral",
	"helical": "helical", "circular": "circular", "round": "round",
	"oval": "oval", "elliptical": "elliptical", "spherical": "spherical",
	"globular": "globular", "cylindrical": "cylindrical", "conical": "conical",
	"pyramidal": "pyramidal", "cubical": "cubical", "rectangular": "rectangular",
	"triangular": "triangular", "square": "square", "pentagonal": "pentagonal",
	"hexagonal": "hexagonal", "octagonal": "octagonal", "polygonal": "polygonal",
	"symmetrical": "symmetrical", "asymmetrical": "asymmetrical", "regular": "regular",
	"irregular": "irregular", "uniform": "uniform", "nonuniform": "nonuniform",
	"consistent": "consistent", "inconsistent": "inconsistent", "coherent": "coherent",
	"incoherent": "incoherent", "logical": "logical", "illogical": "illogical",
	"rational": "rational", "irrational": "irrational", "reasonable": "reasonable",
	"unreasonable": "unreasonable", "sensible": "sensible", "nonsensical": "nonsensical",
	"absurd": "absurd", "ridiculous": "ridiculous", "ludicrous": "ludicrous",
	"preposterous": "preposterous", "outrageous": "outrageous", "scandalous": "scandalous",
	"shocking": "shocking", "astonishing": "astonishing", "amazing": "amazing",
	"astounding": "astounding", "staggering": "staggering", "stunning": "stunning",
	"breathtaking": "breathtaking", "mindblowing": "mindblowing", "jawdropping": "jawdropping",
	"eyeopening": "eyeopening", "earthshaking": "earthshaking", "groundbreaking": "groundbreaking",
	"revolutionary": "revolutionary", "innovative": "innovative", "original": "original",
	"creative": "creative", "imaginative": "imaginative", "inventive": "inventive",
	"resourceful": "resourceful", "ingenious": "ingenious", "clever": "clever",
	"smart": "smart", "intelligent": "intelligent", "brilliant": "brilliant",
	"genius": "genius", "gifted": "gifted", "talented": "talented",
	"skilled": "skilled", "adept": "adept", "proficient": "proficient",
	"competent": "competent", "capable": "capable", "able": "able",
	"qualified": "qualified", "experienced": "experienced", "practiced": "practiced",
	"seasoned": "seasoned", "veteran": "veteran", "expert": "expert",
	"master": "master", "professional": "professional", "specialist": "specialist",
	"authority": "authority", "scholar": "scholar", "academic": "academic",
	"scientist": "scientist", "researcher": "researcher", "investigator": "investigator",
	"analyst": "analyst", "theorist": "theorist", "philosopher": "philosopher",
	"thinker": "thinker", "intellectual": "intellectual", "sage": "sage",
	"wise": "wise", "knowledgeable": "knowledgeable", "learned": "learned",
	"educated": "educated", "literate": "literate", "illiterate": "illiterate",
	"ignorant": "ignorant", "uninformed": "uninformed", "naive": "naive",
	"innocent": "innocent", "simple": "simple", "unsophisticated": "unsophisticated",
	"gullible": "gullible", "credulous": "credulous", "trusting": "trusting",
	"skeptical": "skeptical", "doubtful": "doubtful", "suspicious": "suspicious",
	"cynical": "cynical", "pessimistic": "pessimistic", "optimistic": "optimistic",
	"hopeful": "hopeful", "confident": "confident", "certain": "certain",
	"sure": "sure", "positive": "positive", "negative": "negative",
	"neutral": "neutral", "indifferent": "indifferent", "apathetic": "apathetic",
	"unconcerned": "unconcerned", "detached": "detached", "disinterested": "disinterested",
	"objective": "objective", "subjective": "subjective", "biased": "biased",
	"prejudiced": "prejudiced", "partial": "partial", "impartial": "impartial",
	"fair": "fair", "just": "just", "unjust": "unjust",
	"righteous": "righteous", "virtuous": "virtuous", "moral": "moral",
	"ethical": "ethical", "principled": "principled", "honorable": "honorable",
	"noble": "noble", "upstanding": "upstanding", "respectable": "respectable",
	"decent": "decent", "good": "good", "evil": "evil",
	"wicked": "wicked", "sinful": "sinful", "immoral": "immoral",
	"unethical": "unethical", "corrupt": "corrupt", "dishonest": "dishonest",
	"fraudulent": "fraudulent", "deceitful": "deceitful", "lying": "lying",
	"false": "false", "untrue": "untrue", "truthful": "truthful",
	"honest": "honest", "sincere": "sincere", "genuine": "genuine",
	"authentic": "authentic", "real": "real", "fake": "fake",
	"counterfeit": "counterfeit", "forged": "forged", "sham": "sham",
	"bogus": "bogus", "phony": "phony", "artificial": "artificial",
	"synthetic": "synthetic", "manmade": "manmade", "natural": "natural",
	"organic": "organic", "pure": "pure", "impure": "impure",
	"contaminated": "contaminated", "polluted": "polluted", "toxic": "toxic",
	"poisonous": "poisonous", "hazardous": "hazardous", "dangerous": "dangerous",
	"risky": "risky", "perilous": "perilous", "precarious": "precarious",
	"uncertain": "uncertain", "unpredictable": "unpredictable", "volatile": "volatile",
	"unstable": "unstable", "insecure": "insecure", "safe": "safe",
	"secure": "secure", "protected": "protected", "guarded": "guarded",
	"defended": "defended", "shielded": "shielded", "sheltered": "sheltered",
	"immune": "immune", "resistant": "resistant", "vulnerable": "vulnerable",
	"susceptible": "susceptible", "exposed": "exposed", "open": "open",
	"closed": "closed", "shut": "shut", "locked": "locked",
	"unlocked": "unlocked", "sealed": "sealed", "unsealed": "unsealed",
	"tight": "tight", "loose": "loose", "firm": "firm",
	"stable": "stable", "steady": "steady", "unsteady": "unsteady",
	"shaky": "shaky", "wobbly": "wobbly", "rocky": "rocky",
	"balanced": "balanced", "unbalanced": "unbalanced", "level": "level",
	"even": "even", "uneven": "uneven", "flat": "flat",
	"smooth": "smooth", "rough": "rough", "bumpy": "bumpy",
	"lumpy": "lumpy", "jagged": "jagged", "pointed": "pointed",
	"sharp": "sharp", "blunt": "blunt", "dull": "dull",
	"rounded": "rounded", "curved": "curved", "straight": "straight",
	"bent": "bent", "twisted": "twisted", "coiled": "coiled",
	"spiral": "spiral", "helical": "helical", "circular": "circular",
	"round": "round", "oval": "oval", "elliptical": "elliptical",
	"spherical": "spherical", "globular": "globular", "cylindrical": "cylindrical",
	"conical": "conical", "pyramidal": "pyramidal", "cubical": "cubical",
	"rectangular": "rectangular", "triangular": "triangular", "square": "square",
	"pentagonal": "pentagonal", "hexagonal": "hexagonal", "octagonal": "octagonal",
	"polygonal": "polygonal", "symmetrical": "symmetrical", "asymmetrical": "asymmetrical",
	"regular": "regular", "irregular": "irregular", "uniform": "uniform",
	"nonuniform": "nonuniform", "consistent": "consistent", "inconsistent": "inconsistent",
	"coherent": "coherent", "incoherent": "incoherent", "logical": "logical",
	"illogical": "illogical", "rational": "rational", "irrational": "irrational",
	"reasonable": "reasonable", "unreasonable": "unreasonable", "sensible": "sensible",
	"nonsensical": "nonsensical", "absurd": "absurd", "ridiculous": "ridiculous",
	"ludicrous": "ludicrous", "preposterous": "preposterous", "outrageous": "outrageous",
	"scandalous": "scandalous", "shocking": "shocking", "astonishing": "astonishing",
	"amazing": "amazing", "astounding": "astounding", "staggering": "staggering",
	"stunning": "stunning", "breathtaking": "breathtaking", "mindblowing": "mindblowing",
	"jawdropping": "jawdropping", "eyeopening": "eyeopening", "earthshaking": "earthshaking",
	"groundbreaking": "groundbreaking", "revolutionary": "revolutionary", "innovative": "innovative",
	"original": "original", "creative": "creative", "imaginative": "imaginative",
	"inventive": "inventive", "resourceful": "resourceful", "ingenious": "ingenious",
	"clever": "clever", "smart": "smart", "intelligent": "intelligent",
	"brilliant": "brilliant", "genius": "genius", "gifted": "gifted",
	"talented": "talented", "skilled": "skilled", "adept": "adept",
	"proficient": "proficient", "competent": "competent", "capable": "capable",
	"able": "able", "qualified": "qualified", "experienced": "experienced",
	"practiced": "practiced", "seasoned": "seasoned", "veteran": "veteran",
	"expert": "expert", "master": "master", "professional": "professional",
	"specialist": "specialist", "authority": "authority", "scholar": "scholar",
	"academic": "academic", "scientist": "scientist", "researcher": "researcher",
	"investigator": "investigator", "analyst": "analyst", "theorist": "theorist",
	"philosopher": "philosopher", "thinker": "thinker", "intellectual": "intellectual",
	"sage": "sage", "wise": "wise", "knowledgeable": "knowledgeable",
	"learned": "learned", "educated": "educated", "literate": "literate",
	"illiterate": "illiterate"
	}
	return cases

	def _build_special_regex(self):
	"""Regex để nhận diện các từ đặc biệt"""
	words = sorted(self.special_cases.keys(), key=len, reverse=True)
	return re.compile(r'\b(' + '\|'.join(map(re.escape, words)) + r')\b', flags=re.IGNORECASE)

	def _build_abbreviation_patterns(self):
	"""Xử lý các từ viết tắt"""
	return {
	# Viết tắt chung
	r"\betc\.?\b": "et cetera ",
	r"\bvs\.?\b": "versus ",
	r"\be\.g\.\b": "for example ",
	r"\bi\.e\.\b": "that is ",
	r"\bDr\.?\b": "Doctor ",
	r"\bMr\.?\b": "Mister ",
	r"\bMrs\.?\b": "Misses ",
	r"\bMs\.?\b": "Miss ",
	r"\bProf\.?\b": "Professor ",
	r"\bSt\.?\b": "Saint ",
	r"\bAve\.?\b": "Avenue ",
	r"\bBlvd\.?\b": "Boulevard ",
	r"\bRd\.?\b": "Road ",
	r"\bJan\.?\b": "January ",
	r"\bFeb\.?\b": "February ",
	r"\bMar\.?\b": "March ",
	r"\bApr\.?\b": "April ",
	r"\bJun\.?\b": "June ",
	r"\bJul\.?\b": "July ",
	r"\bAug\.?\b": "August ",
	r"\bSep(?:t)?\.?\b": "September ",
	r"\bOct\.?\b": "October ",
	r"\bNov\.?\b": "November ",
	r"\bDec\.?\b": "December ",
	r"\bapprox\.?\b": "approximately ",
	r"\bmin\.?\b": "minute ",
	r"\bmax\.?\b": "maximum ",
	r"\bdept\.?\b": "department ",

	# Số thứ tự
	r"\b1st\b": "first ",
	r"\b2nd\b": "second ",
	r"\b3rd\b": "third ",
	r"\b4th\b": "fourth ",
	r"\b5th\b": "fifth ",
	r"\b6th\b": "sixth ",
	r"\b7th\b": "seventh ",
	r"\b8th\b": "eighth ",
	r"\b9th\b": "ninth ",
	r"\b10th\b": "tenth ",
	r"\b11th\b": "eleventh ",
	r"\b12th\b": "twelfth ",
	r"\b13th\b": "thirteenth ",
	r"\b14th\b": "fourteenth ",
	r"\b15th\b": "fifteenth ",
	r"\b20th\b": "twentieth ",
	r"\b21st\b": "twenty first ",
	r"\b22nd\b": "twenty second ",
	r"\b23rd\b": "twenty third ",
	r"\b30th\b": "thirtieth ",
	r"\b31st\b": "thirty first ",

	# Số đếm
	r"\b0\b": "zero ",
	r"\b1\b": "one ",
	r"\b2\b": "two ",
	r"\b3\b": "three ",
	r"\b4\b": "four ",
	r"\b5\b": "five ",
	r"\b6\b": "six ",
	r"\b7\b": "seven ",
	r"\b8\b": "eight ",
	r"\b9\b": "nine ",
	r"\b10\b": "ten ",
	r"\b11\b": "eleven ",
	r"\b12\b": "twelve ",
	r"\b13\b": "thirteen ",
	r"\b14\b": "fourteen ",
	r"\b15\b": "fifteen ",
	r"\b16\b": "sixteen ",
	r"\b17\b": "seventeen ",
	r"\b18\b": "eighteen ",
	r"\b19\b": "nineteen ",
	r"\b20\b": "twenty ",
	r"\b30\b": "thirty ",
	r"\b40\b": "forty ",
	r"\b50\b": "fifty ",
	r"\b60\b": "sixty ",
	r"\b70\b": "seventy ",
	r"\b80\b": "eighty ",
	r"\b90\b": "ninety ",
	r"\b100\b": "one hundred ",

	# World Wars
	r"\bWorld War I\b": "World War One",
	r"\bWorld War II\b": "World War Two",
	r"\bWorld War III\b": "World War Three", # Optional
	r"\bWorld War IV\b": "World War Four", # Optional

	# Roman Emperors & Byzantine rulers
	r"\bTheodosius I\b": "Theodosius the First",
	r"\bTheodosius II\b": "Theodosius the Second",
	r"\bConstantine I\b": "Constantine the First",
	r"\bConstantine II\b": "Constantine the Second",
	r"\bConstantine III\b": "Constantine the Third",
	r"\bJustinian I\b": "Justinian the First",
	r"\bJustinian II\b": "Justinian the Second",
	r"\bAlexander I\b": "Alexander the First",
	r"\bAlexander II\b": "Alexander the Second",
	r"\bAlexander III\b": "Alexander the Third",

	# English monarchs
	r"\bHenry I\b": "Henry the First",
	r"\bHenry II\b": "Henry the Second",
	r"\bHenry III\b": "Henry the Third",
	r"\bHenry IV\b": "Henry the Fourth",
	r"\bHenry V\b": "Henry the Fifth",
	r"\bHenry VI\b": "Henry the Sixth",
	r"\bHenry VII\b": "Henry the Seventh",
	r"\bHenry VIII\b": "Henry the Eighth",
	r"\bEdward I\b": "Edward the First",
	r"\bEdward II\b": "Edward the Second",
	r"\bEdward III\b": "Edward the Third",
	r"\bEdward IV\b": "Edward the Fourth",
	r"\bEdward V\b": "Edward the Fifth",
	r"\bEdward VI\b": "Edward the Sixth",
	r"\bEdward VII\b": "Edward the Seventh",
	r"\bEdward VIII\b": "Edward the Eighth",
	r"\bCharles I\b": "Charles the First",
	r"\bCharles II\b": "Charles the Second",
	r"\bCharles III\b": "Charles the Third",
	r"\bJames I\b": "James the First",
	r"\bJames II\b": "James the Second",
	r"\bWilliam I\b": "William the First",
	r"\bWilliam II\b": "William the Second",
	r"\bElizabeth I\b": "Elizabeth the First",
	r"\bElizabeth II\b": "Elizabeth the Second",

	# French monarchs
	r"\bLouis I\b": "Louis the First",
	r"\bLouis II\b": "Louis the Second",
	r"\bLouis III\b": "Louis the Third",
	r"\bLouis IV\b": "Louis the Fourth",
	r"\bLouis V\b": "Louis the Fifth",
	r"\bLouis VI\b": "Louis the Sixth",
	r"\bLouis VII\b": "Louis the Seventh",
	r"\bLouis VIII\b": "Louis the Eighth",
	r"\bLouis IX\b": "Louis the Ninth",
	r"\bLouis X\b": "Louis the Tenth",
	r"\bLouis XI\b": "Louis the Eleventh",
	r"\bLouis XII\b": "Louis the Twelfth",
	r"\bLouis XIII\b": "Louis the Thirteenth",
	r"\bLouis XIV\b": "Louis the Fourteenth",
	r"\bLouis XV\b": "Louis the Fifteenth",
	r"\bLouis XVI\b": "Louis the Sixteenth",
	r"\bPhilip II\b": "Philip the Second",
	r"\bPhilip IV\b": "Philip the Fourth",

	# Russian monarchs
	r"\bNicholas I\b": "Nicholas the First",
	r"\bNicholas II\b": "Nicholas the Second",
	r"\bPeter I\b": "Peter the First",
	r"\bPeter II\b": "Peter the Second",
	r"\bPeter III\b": "Peter the Third",
	r"\bCatherine II\b": "Catherine the Second",

	# Popes
	r"\bPope John Paul I\b": "Pope John Paul the First",
	r"\bPope John Paul II\b": "Pope John Paul the Second",
	r"\bPope Benedict XVI\b": "Pope Benedict the Sixteenth",
	r"\bPope Pius XII\b": "Pope Pius the Twelfth",
	r"\bPope Leo XIII\b": "Pope Leo the Thirteenth",
	r"\bPope Innocent III\b": "Pope Innocent the Third",
	r"\bPope Gregory XIII\b": "Pope Gregory the Thirteenth",

	# Other famous Roman numeral events/titles
	r"\bSuper Bowl I\b": "Super Bowl One",
	r"\bSuper Bowl II\b": "Super Bowl Two",
	r"\bSuper Bowl III\b": "Super Bowl Three",
	r"\bSuper Bowl IV\b": "Super Bowl Four",
	r"\bSuper Bowl V\b": "Super Bowl Five",
	r"\bSuper Bowl X\b": "Super Bowl Ten",
	r"\bSuper Bowl XX\b": "Super Bowl Twenty",
	r"\bFinal Fantasy VII\b": "Final Fantasy Seven",
	r"\bFinal Fantasy VIII\b": "Final Fantasy Eight",
	r"\bFinal Fantasy IX\b": "Final Fantasy Nine",
	r"\bFinal Fantasy X\b": "Final Fantasy Ten"
	}

	def process_text(self, text: str) -> str:
	"""Chuẩn hóa văn bản giữ nguyên ngữ cảnh"""
	# Bước 1: Xử lý từ viết tắt
	for pattern, replacement in self.abbreviation_patterns.items():
	text = re.sub(pattern, replacement, text, flags=re.IGNORECASE)

	# Bước 2: Chuẩn hóa từ đặc biệt (giữ nguyên case)
	def replace_match(match):
	word = match.group(0)
	return self.special_cases.get(word.lower(), word)

	processed_text = self.special_regex.sub(replace_match, text)

	# Bước 3: Chuẩn hóa khoảng trắng
	processed_text = ' '.join(processed_text.split())

	return processed_text

	@staticmethod
	def split_num(num: re.Match) -> str:
	num = num.group()
	if ':' in num:
	hours, minutes = map(int, num.split(':'))
	if minutes == 0:
	return f"{hours} o'clock"
	elif minutes < 10:
	return f'{hours} oh {minutes}'
	return f'{hours} {minutes}'

	year = int(num[:4])
	if year < 1100 or year % 1000 < 10:
	return num

	left, right = num[:2], int(num[2:4])
	suffix = 's' if num.endswith('s') else ''

	if 100 <= year % 1000 <= 999:
	if right == 0:
	return f'{left} hundred{suffix}'
	elif right < 10:
	return f'{left} oh {right}{suffix}'
	return f'{left} {right}{suffix}'

	@staticmethod
	def flip_money(match: re.Match) -> str:
	m = match.group()
	currency = 'dollar' if m[0] == '$' else 'pound'

	if '.' not in m:
	singular = '' if m[1:] == '1' else 's'
	return f'{m[1:]} {currency}{singular}'

	whole, cents = m[1:].split('.')
	singular = '' if whole == '1' else 's'
	cents = int(cents.ljust(2, '0'))
	coins = f"cent{'' if cents == 1 else 's'}" if m[0] == '$' else ('penny' if cents == 1 else 'pence')
	return f'{whole} {currency}{singular} and {cents} {coins}'

	@staticmethod
	def point_num(match):
	whole, fractional = match.group().split('.')
	return ' point '.join([whole, ' '.join(fractional)])

	def normalize_text(self, text: str) -> str:
	replacements = {
	chr(8216): "'",
	chr(8217): "'",
	'«': chr(8220),
	'»': chr(8221),
	chr(8220): '"',
	chr(8221): '"',
	'(': '«',
	')': '»'
	}
	for old, new in replacements.items():
	text = text.replace(old, new)

	punctuation_replacements = {
	'、': ',',
	'。': '.',
	'！': '!',
	'，': ',',
	'：': ':',
	'；': ';',
	'？': '?',
	}
	for old, new in punctuation_replacements.items():
	text = text.replace(old, new + ' ')

	text = re.sub(r'[^\S\n]', ' ', text)
	text = re.sub(r' +', ' ', text)
	text = re.sub(r'(?<=\n) +(?=\n)', '', text)

	abbreviation_patterns = [
	(r'\bD[Rr]\.(?= [A-Z])', 'Doctor'),
	(r'\b(?:Mr\.\|MR\.(?= [A-Z]))', 'Mister'),
	(r'\b(?:Ms\.\|MS\.(?= [A-Z]))', 'Miss'),
	(r'\b(?:Mrs\.\|MRS\.(?= [A-Z]))', 'Mrs'),
	(r'\betc\.(?! [A-Z])', 'etc'),
	(r'(?i)\b(y)eah?\b', r"\1e'a"),
	]
	for pattern, replacement in abbreviation_patterns:
	text = re.sub(pattern, replacement, text)

	text = re.sub(r'\d*\.\d+\|\b\d{4}s?\b\|(?<!:)\b(?:[1-9]\|1[0-2]):[0-5]\d\b(?!:)', self.split_num, text)
	text = re.sub(r'(?<=\d),(?=\d)', '', text)
	text = re.sub(
	r'(?i)[$£]\d+(?:\.\d+)?(?: hundred\| thousand\| (?:[bm]\|tr)illion)*\b\|[$£]\d+\.\d\d?\b',
	self.flip_money,
	text
	)
	text = re.sub(r'\d*\.\d+', self.point_num, text)
	text = re.sub(r'(?<=\d)-(?=\d)', ' to ', text)

	text = re.sub(r'(?<=\d)S', ' S', text)
	text = re.sub(r"(?<=[BCDFGHJ-NP-TV-Z])'?s\b", "'S", text)
	text = re.sub(r"(?<=X')S\b", 's', text)

	text = re.sub(r'(?:[A-Za-z]\.){2,} [a-z]', lambda m: m.group().replace('.', '-'), text)
	text = re.sub(r'(?i)(?<=[A-Z])\.(?=[A-Z])', '-', text)

	return text.strip()

	def tokenize(self, phonemes: str) -> List[int]:
	return [self.VOCAB[x] for x in phonemes if x in self.VOCAB]

	def phonemize(self, text: str, lang: str = 'en-us', normalize: bool = True) -> str:
	if normalize:
	text = self.normalize_text(text)

	if lang not in self.phonemizers:
	print(f"Language '{lang}' not supported. Defaulting to 'en-us'.")
	lang = 'en-us'

	phonemes = self.phonemizers[lang].phonemize([text])
	phonemes = phonemes[0] if phonemes else ''

	replacements = {
	'kəkˈoːɹoʊ': 'kˈoʊkəɹoʊ',
	'kəkˈɔːɹəʊ': 'kˈəʊkəɹəʊ',
	'ʲ': 'j',
	'r': 'ɹ',
	'x': 'k',
	'ɬ': 'l',
	}
	for old, new in replacements.items():
	phonemes = phonemes.replace(old, new)

	phonemes = re.sub(r'(?<=[a-zɹː])(?=hˈʌndɹɪd)', ' ', phonemes)
	phonemes = re.sub(r' z(?=[;:,.!?¡¿—…"«»“” ]\|$)', 'z', phonemes)

	if lang == 'a':
	phonemes = re.sub(r'(?<=nˈaɪn)ti(?!ː)', 'di', phonemes)

	phonemes = ''.join(filter(lambda p: p in self.VOCAB, phonemes))
	return phonemes.strip()

	# Environment setup - prefer the GPU: True when torch reports a usable CUDA device.
	CUDA_AVAILABLE = torch.cuda.is_available()

	class TTSModel:
	    """Holds the loaded models, the text pipelines and the discovered voices."""

	    def __init__(self):
	        """Load the models (CUDA first when available) and index the voices folder.

	        If anything fails while loading, the error is printed and the
	        instance falls back to a single CPU model.
	        """
	        self.use_cuda = CUDA_AVAILABLE
	        self.models = {}
	        self.tokenizer = Tokenizer()
	        self.voice_cache = {}  # only initialised here; filled elsewhere
	        self.voice_files = self._discover_voices()

	        try:
	            if self.use_cuda:
	                self.models['cuda'] = torch.compile(KModel().to('cuda').eval(), mode='max-autotune')
	                # Presumably a warm-up call to trigger compilation up front.
	                # TODO confirm these input shapes match KModel's forward().
	                with torch.no_grad():
	                    self.models['cuda'](torch.randn(1, 64).cuda(), torch.randn(1, 80, 100).cuda(), 1.0)

	            self.models['cpu'] = KModel().to('cpu').eval()
	        except Exception as e:
	            print(f"Error loading model: {e}")
	            self.models = {'cpu': KModel().to('cpu').eval()}
	            # Only a CPU model exists after the fallback, so the flag must
	            # not keep advertising CUDA.
	            self.use_cuda = False

	        self.pipelines = {
	            'a': KPipeline(lang_code='a', model=False),
	            'b': KPipeline(lang_code='b', model=False),
	        }

	    def _discover_voices(self):
	        """Discover available voice files in the voices folder.

	        Returns:
	            Dict mapping voice name (file name without ``.pt``) to the
	            file's path, in alphabetical order. Empty when the folder had
	            to be created.
	        """
	        voice_files = {}
	        voices_dir = "voices"

	        if not os.path.exists(voices_dir):
	            # exist_ok guards against another process creating the folder
	            # between the check above and this call.
	            os.makedirs(voices_dir, exist_ok=True)
	            print(f"Created voices directory at {os.path.abspath(voices_dir)}")
	            return voice_files

	        # os.listdir returns entries in arbitrary order; sort so the voice
	        # list is the same on every start.
	        for file_name in sorted(os.listdir(voices_dir)):
	            if file_name.endswith(".pt"):
	                voice_name = os.path.splitext(file_name)[0]
	                voice_files[voice_name] = os.path.join(voices_dir, file_name)
	                print(f"Found voice: {voice_name}")

	        return voice_files

	    def get_voice_list(self):
	        """Get list of available voices for the UI (prints a warning when empty)."""
	        voices = list(self.voice_files)
	        if not voices:
	            print("Warning: No voice files found in voices folder")
	        return voices

	# Shared module-level instance; constructing it runs TTSModel.__init__ when this module is loaded.
	model_manager = TTSModel()

	class TextProcessor:
	@staticmethod
	def clean_text(text: str) -> str:
	    """Expand special cases, then tidy whitespace and punctuation spacing.

	    After the special-case pipeline has run, tabs and carriage returns
	    become spaces, runs of spaces collapse to one, a single whitespace
	    character directly before ``, . ! ?`` is dropped, and the result is
	    stripped.
	    """
	    expanded = TextProcessor._process_special_cases(text)

	    without_tabs = re.sub(r'[\r\t]', ' ', expanded)
	    single_spaced = re.sub(r' +', ' ', without_tabs)
	    tightened = re.sub(r'(\s)([,.!?])', r'\2', single_spaced)
	    return tightened.strip()

	@staticmethod
	def _process_special_cases(text: str) -> str:
	    """Run every special-case processor over *text* in a fixed order.

	    The order is significant: e-mail addresses and web addresses are
	    handled first, and the generic symbol replacement runs last.
	    """
	    stages = (
	        TextProcessor._process_emails,
	        TextProcessor._process_websites,
	        TextProcessor._process_phone_numbers,
	        TextProcessor._process_temperatures,
	        TextProcessor._process_measurements,
	        TextProcessor._process_currency,
	        TextProcessor._process_percentages,
	        TextProcessor._process_math_operations,
	        TextProcessor._process_times,
	        TextProcessor._process_years,
	        TextProcessor._process_special_symbols,
	    )
	    for stage in stages:
	        text = stage(text)
	    return text

	@staticmethod
	def _process_emails(text: str) -> str:
	"""Process emails with correct English pronunciation for all special characters"""
	def convert_email(match):
	full_email = match.group(0)
	# Replace each special character with its English pronunciation
	processed = (full_email
	.replace('@', ' at ')
	.replace('.', ' dot ')
	.replace('-', ' dash ')
	.replace('_', ' underscore ')
	.replace('+', ' plus ')
	.replace('/', ' slash ')
	.replace('=', ' equals '))
	return processed

	# Regex to match all email formats
	email_pattern = r'\b[\w.+-]+@[\w.-]+\.[a-zA-Z]{2,}\b'
	return re.sub(email_pattern, convert_email, text)

	@staticmethod
	def _process_websites(text: str) -> str:
	"""Process websites with correct English pronunciation for special characters"""
	def convert_website(match):
	url = match.group(1)
	# Replace each special character with its English pronunciation
	return (url.replace('.', ' dot ')
	.replace('-', ' dash ')
	.replace('_', ' underscore ')
	.replace('/', ' slash ')
	.replace('?', ' question mark ')
	.replace('=', ' equals ')
	.replace('&', ' ampersand '))

	# Only process websites that don't contain @ (to avoid conflict with emails)
	website_pattern = r'\b(?![\w.-]@)((?:https?://)?(?:www\.)?[\w.-]+\.[a-z]{2,}(?:[/?=&#][\w.-])*)\b'
	return re.sub(website_pattern, convert_website, text, flags=re.IGNORECASE)

	@staticmethod
	def _process_temperatures(text: str) -> str:
	"""Process temperatures and cardinal directions with degree symbols"""
	def temp_to_words(temp, unit):
	temp_text = TextProcessor._number_to_words(temp)
	unit = unit.upper() if unit else ''

	unit_map = {
	'C': 'degrees Celsius',
	'F': 'degrees Fahrenheit',
	'N': 'degrees north',
	'S': 'degrees south',
	'E': 'degrees east',
	'W': 'degrees west',
	'': 'degrees' # Default case for just number with degree symbol
	}
	unit_text = unit_map.get(unit, f'degrees {unit}')

	return f"{temp_text} {unit_text}"

	# Process formats like 75°F, 100°C, 15°N, 120°E
	text = re.sub(
	r'(-?\d+)°([NSEWCFnsewcf]?)',
	lambda m: temp_to_words(m.group(1), m.group(2)),
	text,
	flags=re.IGNORECASE
	)

	# Add degree symbol pronunciation when standalone
	text = re.sub(r'°', ' degrees ', text)

	return text

	@staticmethod
	def _process_measurements(text: str) -> str:
	    """Spell out "<number> <unit>" measurements, including decimals.

	    Handles forms such as ``180 km/h``, ``60 kg``, ``3.5 L``, ``250 ml``.
	    Whitespace between number and unit is required, so tokens such as
	    ``1990s`` are not read as seconds. A value of exactly 1 takes the
	    singular unit name, every other value the plural.
	    """
	    # unit symbol -> (singular, plural) spoken form
	    units_map = {
	        'km/h': ('kilometer per hour', 'kilometers per hour'),
	        'mph': ('mile per hour', 'miles per hour'),
	        'kg': ('kilogram', 'kilograms'),
	        'g': ('gram', 'grams'),
	        'cm': ('centimeter', 'centimeters'),
	        'm': ('meter', 'meters'),
	        'mm': ('millimeter', 'millimeters'),
	        'L': ('liter', 'liters'),
	        'l': ('liter', 'liters'),
	        'ml': ('milliliter', 'milliliters'),
	        'mL': ('milliliter', 'milliliters'),
	        'h': ('hour', 'hours'),
	        'min': ('minute', 'minutes'),
	        's': ('second', 'seconds'),
	    }

	    def measurement_to_words(match):
	        value, unit = match.group(1), match.group(2)
	        try:
	            # Decimals are read digit by digit after "point".
	            if '.' in value:
	                integer_part, decimal_part = value.split('.')
	                value_text = (f"{TextProcessor._number_to_words(integer_part)} "
	                              f"point {' '.join(TextProcessor._digit_to_word(d) for d in decimal_part)}")
	            else:
	                value_text = TextProcessor._number_to_words(value)

	            # The pattern is case-insensitive, so try the exact spelling
	            # first and then the lower-case one.
	            forms = units_map.get(unit, units_map.get(unit.lower()))
	            if forms is None:
	                unit_text = unit
	            else:
	                singular, plural = forms
	                unit_text = singular if float(value) == 1 else plural

	            return f"{value_text} {unit_text}"
	        except Exception:
	            # Best effort: leave the measurement exactly as written.
	            return match.group(0)

	    # Longest symbols first; joined with a bare "|" so they are real
	    # alternatives rather than one literal string.
	    unit_alternation = '|'.join(
	        re.escape(key) for key in sorted(units_map, key=len, reverse=True)
	    )
	    return re.sub(
	        r'(-?\d+(?:\.\d+)?)\s+({})\b'.format(unit_alternation),
	        measurement_to_words,
	        text,
	        flags=re.IGNORECASE,
	    )

	@staticmethod
	def _process_currency(text: str) -> str:
	    """Spell out amounts written with a leading currency symbol.

	    ``$10`` becomes "<ten in words> dollars". An amount of exactly 1
	    takes the singular currency name.
	    """
	    # symbol -> (singular, plural)
	    currency_map = {
	        '$': ('dollar', 'dollars'),
	        '€': ('euro', 'euros'),
	        '£': ('pound', 'pounds'),
	        '¥': ('yen', 'yen'),
	        '₩': ('won', 'won'),
	        '₽': ('ruble', 'rubles'),
	    }

	    def currency_to_words(match):
	        symbol, value = match.group(1), match.group(2)
	        singular, plural = currency_map[symbol]
	        value_text = TextProcessor._number_to_words(value)
	        currency_text = singular if float(value) == 1 else plural
	        return f"{value_text} {currency_text}"

	    symbols = ''.join(re.escape(symbol) for symbol in currency_map)
	    # The fraction is only part of the amount when digits follow the
	    # period, so a sentence-ending "." after "$10" is left in place.
	    return re.sub(
	        r'([' + symbols + r'])(\d+(?:\.\d+)?)',
	        currency_to_words,
	        text,
	    )

	@staticmethod
	def _process_percentages(text: str) -> str:
	"""Xử lý phần trăm"""
	text = re.sub(
	r'(\d+\.?\d*)%',
	lambda m: f"{TextProcessor._number_to_words(m.group(1))} percent",
	text
	)
	return text

	@staticmethod
	def _process_math_operations(text: str) -> str:
	"""Xử lý các phép toán"""
	math_map = {
	'+': 'plus',
	'-': 'minus',
	'×': 'times',
	'*': 'times',
	'÷': 'divided by',
	'/': 'divided by',
	'=': 'equals',
	'>': 'is greater than',
	'<': 'is less than'
	}

	# Xử lý phép toán đơn giản 2+2=4
	text = re.sub(
	r'(\d+)\s([+×÷/=><-])\s*(\d+)',
	lambda m: (f"{TextProcessor._number_to_words(m.group(1))} "
	f"{math_map.get(m.group(2), m.group(2))} "
	f"{TextProcessor._number_to_words(m.group(3))}"),
	text
	)

	# Xử lý phân số 4/5
	text = re.sub(
	r'(\d+)/(\d+)',
	lambda m: (f"{TextProcessor._number_to_words(m.group(1))} "
	f"divided by {TextProcessor._number_to_words(m.group(2))}"),
	text
	)

	return text

	@staticmethod
	def _process_special_symbols(text: str) -> str:
	"""Xử lý các ký hiệu đặc biệt"""
	symbol_map = {
	'@': 'at',
	'#': 'number',
	'&': 'and',
	'_': 'underscore'
	}

	# Xử lý @home → at home
	text = re.sub(
	r'@(\w+)',
	lambda m: f"at {m.group(1)}",
	text
	)

	# Xử lý #1 → number one
	text = re.sub(
	r'#(\d+)',
	lambda m: f"number {TextProcessor._number_to_words(m.group(1))}",
	text
	)

	# Xử lý các ký hiệu đơn lẻ
	for symbol, replacement in symbol_map.items():
	text = text.replace(symbol, f' {replacement} ')

	return text

	@staticmethod
	def _process_times(text: str) -> str:
	"""Xử lý định dạng thời gian thành cách đọc tự nhiên"""
	# Xử lý định dạng 12:30, 12:30 AM/PM
	text = re.sub(
	r'\b(\d{1,2}):(\d{2})\s*(AM\|PM\|am\|pm)?\b',
	lambda m: TextProcessor._time_to_words(m.group(1), m.group(2), m.group(3)),
	text
	)
	return text

	@staticmethod
	def _time_to_words(hour: str, minute: str, period: str = None) -> str:
	"""Chuyển thời gian thành cách đọc tự nhiên"""
	hour_int = int(hour)
	minute_int = int(minute)

	# Xử lý AM/PM
	period_text = ""
	if period:
	period_text = " AM" if period.upper() == "AM" else " PM"

	# Xử lý giờ
	if hour_int == 0:
	hour_text = "twelve"
	elif hour_int <= 12:
	hour_text = TextProcessor._number_to_words(str(hour_int))
	else:
	hour_text = TextProcessor._number_to_words(str(hour_int - 12))

	# Xử lý phút
	if minute_int == 0:
	minute_text = "o'clock"
	elif minute_int < 10:
	minute_text = "oh " + TextProcessor._number_to_words(str(minute_int))
	else:
	minute_text = TextProcessor._number_to_words(str(minute_int))

	# Kết hợp thành câu
	if minute_int == 0:
	return f"{hour_text}{period_text}"
	return f"{hour_text} {minute_text}{period_text}"

	@staticmethod
	def _process_years(text: str) -> str:
	"""Xử lý các năm trong văn bản"""
	# Xử lý năm 4 chữ số từ 1000-2999 (phổ biến nhất)
	text = re.sub(
	r'\b(1[0-9]{3}\|2[0-9]{3})\b',
	lambda m: TextProcessor._year_to_words(m.group(1)),
	text
	)

	# Xử lý năm 2 chữ số (nếu cần)
	text = re.sub(
	r'\b([0-9]{2})\b',
	lambda m: TextProcessor._two_digit_year_to_words(m.group(1)),
	text
	)

	return text

	@staticmethod
	def _year_to_words(year: str) -> str:
	"""Chuyển năm 4 chữ số thành chữ"""
	if len(year) != 4:
	return year

	# Năm từ 2000-2099 có thể đọc là "two thousand twenty-one" hoặc "twenty twenty-one"
	if year.startswith('20'):
	# Lựa chọn cách đọc phổ biến hơn
	return f"twenty {TextProcessor._two_digit_year_to_words(year[2:])}"

	# Các năm khác đọc bình thường
	return TextProcessor._number_to_words(year)

	@staticmethod
	def _two_digit_year_to_words(num: str) -> str:
	"""Chuyển số 2 chữ số thành chữ (cho năm)"""
	if len(num) != 2:
	return num

	num_int = int(num)
	if num_int == 0:
	return "zero zero"
	if num_int < 10:
	return f"oh {TextProcessor._digit_to_word(num[1])}"

	ones = ['', 'one', 'two', 'three', 'four', 'five', 'six', 'seven', 'eight', 'nine',
	'ten', 'eleven', 'twelve', 'thirteen', 'fourteen', 'fifteen', 'sixteen',
	'seventeen', 'eighteen', 'nineteen']
	tens = ['', '', 'twenty', 'thirty', 'forty', 'fifty', 'sixty', 'seventy',
	'eighty', 'ninety']

	if num_int < 20:
	return ones[num_int]

	ten, one = divmod(num_int, 10)
	if one == 0:
	return tens[ten]
	return f"{tens[ten]} {ones[one]}"

	@staticmethod
	def _process_phone_numbers(text: str) -> str:
	"""Xử lý số điện thoại với regex chính xác hơn"""
	# Pattern mới tránh xung đột với số La Mã
	phone_pattern = r'\b(\d{3})[-. ]?(\d{3})[-. ]?(\d{4})\b'

	def phone_to_words(match):
	groups = match.groups()
	# Đọc từng số trong từng nhóm và thêm dấu phẩy (,) để tạo ngắt nghỉ
	parts = []
	for part in groups:
	digits = ' '.join([TextProcessor._digit_to_word(d) for d in part])
	parts.append(digits)
	return ', '.join(parts) # Thêm dấu phẩy để tạo ngắt nghỉ khi đọc

	return re.sub(phone_pattern, phone_to_words, text)
	@staticmethod
	def _process_currency_numbers(text: str) -> str:
	return re.sub(
	r'\$?(\d{1,3}(?:,\d{3})*(?:\.\d+)?)\b',
	lambda m: f"{TextProcessor._number_to_words(m.group(1))} dollars" if '$' in m.group(0)
	else TextProcessor._number_to_words(m.group(1)),
	text
	)

	@staticmethod
	def _digit_to_word(digit: str) -> str:
	digit_map = {
	'0': 'zero', '1': 'one', '2': 'two', '3': 'three', '4': 'four',
	'5': 'five', '6': 'six', '7': 'seven', '8': 'eight', '9': 'nine'
	}
	return digit_map.get(digit, digit)

	@staticmethod
	def _number_to_words(number: str) -> str:
	num_str = number.replace(',', '')

	try:
	if '.' in num_str:
	integer_part, decimal_part = num_str.split('.')
	integer_text = TextProcessor._int_to_words(integer_part)
	decimal_text = ' '.join([TextProcessor._digit_to_word(d) for d in decimal_part])
	return f"{integer_text} point {decimal_text}"
	return TextProcessor._int_to_words(num_str)
	except:
	return number

	@staticmethod
	def _digits_to_words(digits: str) -> str:
	return ' '.join([TextProcessor._digit_to_word(d) for d in digits])

	@staticmethod
	def _int_to_words(num_str: str) -> str:
	num = int(num_str)
	if num == 0:
	return 'zero'

	units = ['', 'thousand', 'million', 'billion', 'trillion']
	words = []
	level = 0

	while num > 0:
	chunk = num % 1000
	if chunk != 0:
	words.append(TextProcessor._convert_less_than_thousand(chunk) + ' ' + units[level])
	num = num // 1000
	level += 1

	return ' '.join(reversed(words)).strip()

	@staticmethod
	def _convert_less_than_thousand(num: int) -> str:
	ones = ['', 'one', 'two', 'three', 'four', 'five', 'six', 'seven', 'eight', 'nine',
	'ten', 'eleven', 'twelve', 'thirteen', 'fourteen', 'fifteen', 'sixteen',
	'seventeen', 'eighteen', 'nineteen']
	tens = ['', '', 'twenty', 'thirty', 'forty', 'fifty', 'sixty', 'seventy',
	'eighty', 'ninety']

	if num == 0:
	return ''
	if num < 20:
	return ones[num]
	if num < 100:
	return tens[num // 10] + (' ' + ones[num % 10] if num % 10 != 0 else '')
	return ones[num // 100] + ' hundred' + (' ' + TextProcessor._convert_less_than_thousand(num % 100) if num % 100 != 0 else '')

	@staticmethod
	def split_sentences(text: str) -> List[str]:
	re_special_cases = re.compile(r'(?<!\w)([A-Z][a-z]*\.)(?=\s)')
	re_sentence_split = re.compile(r'(?<=[.!?])\s+')

	sentences = []
	for line in text.split('\n'):
	stripped = line.strip()
	if stripped:
	stripped = re_special_cases.sub(r'\1Ⓝ', stripped)
	parts = re_sentence_split.split(stripped)
	for part in parts:
	part = part.replace('Ⓝ', '')
	if part:
	sentences.append(part)
	return sentences

	@staticmethod
	def parse_dialogues(text: str, prefixes: List[str]) -> List[Tuple[str, str]]:
	"""Phân tích nội dung hội thoại với các prefix chỉ định"""
	dialogues = []
	current = None

	for line in text.split('\n'):
	line = line.strip()
	if not line:
	continue

	# Kiểm tra xem dòng có bắt đầu bằng bất kỳ prefix nào không
	found_prefix = None
	for prefix in prefixes:
	if line.lower().startswith(prefix.lower() + ':'):
	found_prefix = prefix
	break

	if found_prefix:
	if current:
	# Xử lý các trường hợp đặc biệt trước khi thêm vào dialogues
	processed_content = TextProcessor._process_special_cases(current[1])
	dialogues.append((current[0], processed_content))

	speaker = found_prefix
	content = line[len(found_prefix)+1:].strip()
	current = (speaker, content)
	elif current:
	current = (current[0], current[1] + ' ' + line)

	if current:
	# Xử lý các trường hợp đặc biệt cho dòng cuối cùng
	processed_content = TextProcessor._process_special_cases(current[1])
	dialogues.append((current[0], processed_content))

	return dialogues

	class AudioProcessor:
	    """Static helpers for post-processing and joining synthesized audio."""

	    # Final punctuation character -> name of the pause setting it selects.
	    _PAUSE_KEYS = {
	        '.': 'dot_pause',
	        '?': 'ques_pause',
	        '!': 'excl_pause',
	        ',': 'comma_pause',
	        ':': 'colon_pause',
	        ';': 'semi_pause',
	        '-': 'dash_pause',
	        '–': 'dash_pause',
	        '—': 'dash_pause',
	    }
	    # Setting used when the more specific one is absent from the settings.
	    _PAUSE_FALLBACKS = {
	        'excl_pause': 'dot_pause',
	        'semi_pause': 'colon_pause',
	        'dash_pause': 'comma_pause',
	    }

	    @staticmethod
	    def enhance_audio(audio: np.ndarray, volume: float = 1.0, pitch: float = 1.0) -> np.ndarray:
	        """Normalize, soft-clip, optionally re-pitch, compress and filter audio.

	        Args:
	            audio: Mono samples as a float array; treated as 24 kHz audio.
	            volume: Linear gain applied after peak normalization.
	            pitch: Frame-rate multiplier. Any value other than 1.0 reinterprets
	                the samples at ``24000 * pitch`` Hz and resamples to 24 kHz.

	        Returns:
	            The processed samples as floats (16-bit samples divided by 32768).
	        """
	        # NOTE(review): the model output may be half precision when autocast
	        # is active; float32 keeps the int16 scaling below exact. TODO confirm.
	        audio = np.asarray(audio, dtype=np.float32)

	        # 1. Peak-normalize with 10% headroom, then apply the volume.
	        peak = np.max(np.abs(audio)) + 1e-8
	        audio = (audio / peak) * 0.9 * volume

	        # 2. Soft clipping with tanh to avoid hard-clipping distortion.
	        audio = np.tanh(audio * 1.5) / 1.5

	        # 3. Convert to a 16-bit mono AudioSegment.
	        audio_seg = AudioSegment(
	            (audio * 32767).astype(np.int16).tobytes(),
	            frame_rate=24000,
	            sample_width=2,
	            channels=1
	        )

	        # 4. Pitch shift by overriding the frame rate, with short fades.
	        if pitch != 1.0:
	            audio_seg = audio_seg._spawn(
	                audio_seg.raw_data,
	                overrides={"frame_rate": int(audio_seg.frame_rate * pitch)}
	            ).set_frame_rate(24000).fade_in(10).fade_out(10)

	        # 5. Dynamics compression and band limiting.
	        audio_seg = compress_dynamic_range(
	            audio_seg,
	            threshold=-12.0,
	            ratio=3.5,
	            attack=5,
	            release=50
	        )
	        audio_seg = audio_seg.low_pass_filter(11000).high_pass_filter(200)

	        # 6. Safety normalization: pull peaks above -1 dBFS down to -1 dBFS.
	        #    The previous gain of `-max_dBFS * 0.8` was positive for a
	        #    negative peak, so it boosted the signal towards full scale.
	        peak_dbfs = audio_seg.max_dBFS
	        if peak_dbfs > -1.0:
	            audio_seg = audio_seg.apply_gain(-1.0 - peak_dbfs)

	        return np.array(audio_seg.get_array_of_samples()) / 32768.0

	    @staticmethod
	    def calculate_pause(text: str, pause_settings: Dict[str, int]) -> int:
	        """Return the pause in milliseconds to insert after ``text``.

	        Args:
	            text: The sentence or fragment that was just spoken.
	            pause_settings: Pause lengths keyed by setting name
	                (``'dot_pause'``, ``'ques_pause'``, ``'default_pause'``, ...).
	                A key equal to the punctuation character itself takes priority.

	        Returns:
	            0 for empty text or text ending in a listed abbreviation; the
	            ``'time_colon_pause'`` value (default 50) if the text contains a
	            clock time; otherwise the pause configured for the last
	            character, falling back to ``'default_pause'`` (0 if absent).
	        """
	        text = text.strip()
	        if not text:
	            return 0

	        # Abbreviations at the end of the text get no pause.
	        if re.search(r'(?:^|\s)(?:Mr|Mrs|Ms|Dr|Prof|St|A\.M|P\.M|etc|e\.g|i\.e)\.$', text, re.IGNORECASE):
	            return 0

	        # NOTE(review): this matches a clock time anywhere in the text, so a
	        # full sentence that mentions a time also gets the short pause.
	        if re.search(r'\b\d{1,2}:\d{2}\b', text):
	            return pause_settings.get('time_colon_pause', 50)

	        default = pause_settings.get('default_pause', 0)

	        # Look past closing quotes/brackets so 'He said "hi."' counts as '.'.
	        core = text.rstrip('"\'”’»)]')
	        if not core:
	            return default
	        last_char = core[-1]

	        if last_char in pause_settings:
	            return pause_settings[last_char]

	        # Settings are keyed by name, not by character, so the character must
	        # be translated first; a direct lookup always gave the default.
	        key = AudioProcessor._PAUSE_KEYS.get(last_char)
	        while key is not None:
	            if key in pause_settings:
	                return pause_settings[key]
	            key = AudioProcessor._PAUSE_FALLBACKS.get(key)
	        return default

	    @staticmethod
	    def _join_segments(segments, pauses, start, fade_ms, min_pause_ms):
	        """Append faded segments to ``start``, with silence between them."""
	        combined = start
	        last_index = len(segments) - 1
	        for index, (seg, pause) in enumerate(zip(segments, pauses)):
	            combined += seg.fade_in(fade_ms).fade_out(fade_ms)
	            # No trailing silence after the final segment.
	            if index < last_index:
	                combined += AudioSegment.silent(duration=max(min_pause_ms, pause))
	        return combined

	    @staticmethod
	    def combine_segments(segments: List["AudioSegment"], pauses: List[int]) -> "AudioSegment":
	        """Join segments with 10 ms fades and pauses of at least 50 ms.

	        Args:
	            segments: Audio segments in playback order.
	            pauses: Pause in milliseconds to insert after each segment.

	        Returns:
	            The concatenated audio; nothing is added after the last segment.
	        """
	        return AudioProcessor._join_segments(
	            segments, pauses, AudioSegment.silent(duration=0), fade_ms=10, min_pause_ms=50
	        )

	    @staticmethod
	    def combine_with_pauses(segments: List["AudioSegment"], pauses: List[int]) -> "AudioSegment":
	        """Join segments with 50 ms fades and exactly the given pauses.

	        Args:
	            segments: Audio segments in playback order.
	            pauses: Pause in milliseconds to insert after each segment.

	        Returns:
	            The concatenated audio; nothing is added after the last segment.
	        """
	        return AudioProcessor._join_segments(
	            segments, pauses, AudioSegment.empty(), fade_ms=50, min_pause_ms=0
	        )

	class SubtitleGenerator:
	    """Static helpers that turn timed audio segments into SRT subtitles."""

	    @staticmethod
	    def clean_subtitle_text(text: str) -> str:
	        """Remove a leading ``Q:``, ``A:`` or ``CHAR<n>:`` speaker prefix.

	        Args:
	            text: Subtitle text, possibly starting with a speaker prefix.

	        Returns:
	            The stripped text without the prefix and the spaces after it.
	        """
	        return re.sub(r'^(?:Q|A|CHAR\d+):\s*', '', text.strip())

	    @staticmethod
	    def split_long_sentences(text: str, max_length: int = 120) -> List[str]:
	        """Split text at ``.``, ``!`` and ``?`` into chunks of limited length.

	        Consecutive pieces are merged while the chunk stays within
	        ``max_length`` characters. A single piece longer than ``max_length``
	        is kept whole.

	        Args:
	            text: The text to split.
	            max_length: Maximum length of a merged chunk in characters.

	        Returns:
	            The chunks in order; empty for empty text.
	        """
	        # With a capturing group, re.split alternates text and punctuation and
	        # always returns an odd number of items; the last one is whatever
	        # follows the final punctuation mark.
	        parts = re.split(r'([.!?])', text)
	        pieces = [parts[i] + parts[i + 1] for i in range(0, len(parts) - 1, 2)]
	        # Keep the unpunctuated tail. It used to be dropped, so text without
	        # any '.', '!' or '?' produced no chunk at all.
	        if parts[-1].strip():
	            pieces.append(parts[-1])

	        sentences = []
	        current = ""
	        for piece in pieces:
	            if len(current) + len(piece) <= max_length:
	                current += piece
	            else:
	                if current:
	                    sentences.append(current)
	                current = piece

	        if current:
	            sentences.append(current)

	        return sentences

	    @staticmethod
	    def _format_timestamp(milliseconds: int) -> str:
	        """Format a millisecond offset as an SRT ``HH:MM:SS,mmm`` timestamp."""
	        hours, remainder = divmod(int(milliseconds), 3_600_000)
	        minutes, remainder = divmod(remainder, 60_000)
	        seconds, millis = divmod(remainder, 1000)
	        return f"{hours:02d}:{minutes:02d}:{seconds:02d},{millis:03d}"

	    @staticmethod
	    def generate_srt(audio_segments: List["AudioSegment"], sentences: List[str],
	                     pause_settings: Dict[str, int],
	                     initial_offset_ms: int = 0, min_pause_ms: int = 50) -> str:
	        """Build SRT subtitles whose timing follows the combined audio.

	        Args:
	            audio_segments: One segment per sentence; ``len(segment)`` is
	                used as its duration in milliseconds.
	            sentences: The text spoken in each segment, in the same order.
	            pause_settings: Settings passed to
	                ``AudioProcessor.calculate_pause`` for the gaps.
	            initial_offset_ms: Silence before the first segment. The default
	                of 0 matches ``AudioProcessor.combine_segments``.
	            min_pause_ms: Minimum gap between segments. The default of 50
	                matches ``AudioProcessor.combine_segments``.

	        Returns:
	            The subtitles in SRT format, entries separated by a blank line.
	        """
	        subtitles = []
	        current_time = initial_offset_ms
	        max_subtitle_length = 120  # maximum characters per subtitle entry
	        last_index = len(audio_segments) - 1

	        for i, (seg, sentence) in enumerate(zip(audio_segments, sentences)):
	            # Speaker prefixes are not shown in subtitles.
	            cleaned_sentence = SubtitleGenerator.clean_subtitle_text(sentence)

	            # Split long sentences into smaller chunks at punctuation.
	            sentence_chunks = [
	                chunk.strip()
	                for chunk in SubtitleGenerator.split_long_sentences(cleaned_sentence, max_subtitle_length)
	                if chunk.strip()
	            ]

	            # The segment's duration is shared equally between its chunks.
	            chunk_duration = len(seg) / max(1, len(sentence_chunks))

	            for j, chunk in enumerate(sentence_chunks):
	                start_time = current_time + (j * chunk_duration)
	                subtitles.append({
	                    'start': int(start_time),
	                    'end': int(start_time + chunk_duration),
	                    'text': chunk
	                })

	            current_time += len(seg)

	            # Same gap rule as the audio: none after the last segment.
	            if i < last_index:
	                pause = AudioProcessor.calculate_pause(sentence, pause_settings)
	                current_time += max(min_pause_ms, pause)

	        # Entry format: index, "start --> end", text.
	        srt_content = [
	            f"{idx}\n"
	            f"{SubtitleGenerator._format_timestamp(sub['start'])} --> "
	            f"{SubtitleGenerator._format_timestamp(sub['end'])}\n"
	            f"{sub['text']}\n"
	            for idx, sub in enumerate(subtitles, 1)
	        ]

	        return "\n".join(srt_content)

	class TTSGenerator:
	    """Turns text into audio, statistics and subtitles using the loaded models."""

	    def __init__(self):
	        self.text_processor = TextProcessor()
	        self.audio_processor = AudioProcessor()
	        self.tokenizer = Tokenizer()
	        self.subtitle_generator = SubtitleGenerator()

	    def generate_sentence_audio(self, sentence: str, voice: str, speed: float,
	                                device: str, volume: float = 1.0, pitch: float = 1.0) -> Optional[Tuple[int, np.ndarray]]:
	        """Synthesize one sentence with the given voice.

	        Args:
	            sentence: The text to speak.
	            voice: Name of a voice registered in ``model_manager.voice_files``.
	            speed: Speaking-rate value passed to the pipeline and the model.
	            device: ``'cuda'`` or ``'cpu'``; selects the model and autocast.
	            volume: Forwarded to ``AudioProcessor.enhance_audio``.
	            pitch: Forwarded to ``AudioProcessor.enhance_audio``.

	        Returns:
	            ``(24000, samples)`` on success; ``None`` if the voice is unknown,
	            cannot be loaded, the pipeline yields nothing, or any error occurs
	            (errors are printed, not raised).
	        """
	        try:
	            # Check if the voice exists.
	            if voice not in model_manager.voice_files:
	                print(f"Voice {voice} not found in voices folder")
	                return None

	            # Load the voice if it is not cached yet.
	            if voice not in model_manager.voice_cache:
	                voice_path = model_manager.voice_files[voice]
	                try:
	                    # SECURITY NOTE(review): torch.load unpickles the file;
	                    # only load voice files from trusted sources (consider
	                    # weights_only=True if the torch version supports it).
	                    voice_data = torch.load(voice_path, map_location='cpu')

	                    # The voice file is used directly as the reference pack.
	                    pipeline = model_manager.pipelines['a']  # or 'b' depending on your needs
	                    pack = voice_data

	                    model_manager.voice_cache[voice] = (pipeline, pack)
	                except Exception as e:
	                    print(f"Error loading voice {voice}: {e}")
	                    return None
	            else:
	                pipeline, pack = model_manager.voice_cache[voice]

	            processed_text = self.tokenizer.process_text(sentence)

	            # Only the first item yielded by the pipeline is synthesized.
	            for _, ps, _ in pipeline(processed_text, voice, speed):
	                ref_s = pack[len(ps)-1]

	                if device == 'cuda':
	                    ps = ps.cuda()
	                    ref_s = ref_s.cuda()

	                with torch.cuda.amp.autocast(enabled=(device=='cuda')):
	                    audio = model_manager.models[device](ps, ref_s, speed).cpu().numpy()

	                return (24000, self.audio_processor.enhance_audio(audio, volume, pitch))

	            # The pipeline produced nothing for this text.
	            return None

	        except Exception as e:
	            print(f"Error generating audio: {e}")
	            return None

	    def generate_story_audio(self, text: str, voice: str, speed: float, device: str,
	                             pause_settings: Dict[str, int], volume: float = 1.0,
	                             pitch: float = 1.0) -> Tuple[Optional[Tuple[int, np.ndarray]], str, str]:
	        """Synthesize a whole text sentence by sentence and build subtitles.

	        Args:
	            text: The raw input text.
	            voice: Voice name passed to ``generate_sentence_audio``.
	            speed: Speaking rate; pauses are divided by it (clamped to 0.5-2.0).
	            device: ``'cuda'`` or ``'cpu'``.
	            pause_settings: Must contain ``'default_pause'``, ``'dot_pause'``,
	                ``'ques_pause'``, ``'comma_pause'`` and ``'colon_pause'`` in
	                milliseconds; ``'excl_pause'``, ``'semi_pause'`` and
	                ``'dash_pause'`` are optional.
	            volume: Forwarded to ``generate_sentence_audio``.
	            pitch: Forwarded to ``generate_sentence_audio``.

	        Returns:
	            ``(audio, stats, subtitles)``. ``audio`` is ``(frame_rate, data)``
	            where ``data`` holds the encoded MP3 bytes as a ``uint8`` array,
	            or ``None`` when nothing could be generated (``stats`` then holds
	            the reason and ``subtitles`` is empty).
	        """
	        start_time = time.time()
	        clean_text = self.text_processor.clean_text(text)
	        sentences = self.text_processor.split_sentences(clean_text)

	        if not sentences:
	            return None, "No content to read", ""

	        # Scale the pauses with the speaking rate.
	        speed_factor = max(0.5, min(2.0, speed))

	        def scaled(key, fallback=None):
	            if fallback is None:
	                value = pause_settings[key]
	            else:
	                value = pause_settings.get(key, pause_settings[fallback])
	            return int(value / speed_factor)

	        adjusted_pause_settings = {
	            'default_pause': scaled('default_pause'),
	            'dot_pause': scaled('dot_pause'),
	            'ques_pause': scaled('ques_pause'),
	            'comma_pause': scaled('comma_pause'),
	            'colon_pause': scaled('colon_pause'),
	            'excl_pause': scaled('excl_pause', 'dot_pause'),
	            'semi_pause': scaled('semi_pause', 'colon_pause'),
	            'dash_pause': scaled('dash_pause', 'comma_pause'),
	            'time_colon_pause': 50  # fixed short pause for time formats
	        }

	        audio_segments = []
	        pause_durations = []
	        # Only sentences that produced audio. Subtitles must be paired with
	        # these, not with the full list, or one failed sentence shifts every
	        # later subtitle onto the wrong segment.
	        spoken_sentences = []

	        for sentence in sentences:
	            result = self.generate_sentence_audio(sentence, voice, speed, device, volume, pitch)
	            if not result:
	                continue

	            sample_rate, audio_data = result
	            audio_segments.append(AudioSegment(
	                (audio_data * 32767).astype(np.int16).tobytes(),
	                frame_rate=sample_rate,
	                sample_width=2,
	                channels=1
	            ))
	            spoken_sentences.append(sentence)
	            pause_durations.append(
	                self.audio_processor.calculate_pause(sentence, adjusted_pause_settings)
	            )

	        if not audio_segments:
	            return None, "Failed to generate audio", ""

	        combined_audio = self.audio_processor.combine_segments(audio_segments, pause_durations)

	        # Encode to MP3 in memory and hand the bytes back as a uint8 array.
	        with io.BytesIO() as buffer:
	            combined_audio.export(buffer, format="mp3", bitrate="256k", parameters=["-ar", str(combined_audio.frame_rate)])
	            buffer.seek(0)
	            audio_data = np.frombuffer(buffer.read(), dtype=np.uint8)

	        # Subtitles use the same segments and pause settings as the audio.
	        subtitles = self.subtitle_generator.generate_srt(audio_segments, spoken_sentences, adjusted_pause_settings)

	        stats = (f"Processed {len(clean_text)} chars, {len(clean_text.split())} words\n"
	                 f"Audio duration: {len(combined_audio)/1000:.2f}s\n"
	                 f"Time: {time.time() - start_time:.2f}s\n"
	                 f"Device: {device.upper()}")

	        return (combined_audio.frame_rate, audio_data), stats, subtitles

	def create_interface():
	    """Build the Gradio UI for text-to-speech with SRT subtitle output.

	    Returns:
	        The ``gr.Blocks`` application, ready to be launched.
	    """
	    import tempfile

	    css = """
	    .gradio-container { max-width: 1000px !important; }
	    .audio-output { height: 300px !important; }
	    .advanced-settings { background-color: #f5f5f5; padding: 15px; border-radius: 5px; }
	    .tab { min-height: 500px; }
	    .qa-example { font-family: monospace; white-space: pre; background-color: #f8f9fa; padding: 10px; border-radius: 5px; }
	    .char-settings { display: grid; grid-template-columns: repeat(4, 1fr); gap: 10px; margin-bottom: 15px; }
	    .char-settings .voice-select { min-width: 150px; }
	    .char-settings .speed-slider { min-width: 120px; }
	    .subtitle-output { max-height: 300px; overflow-y: auto; }
	    .download-btn { margin-top: 10px; }
	    """

	    # Query the voice list once instead of three times.
	    voice_choices = model_manager.get_voice_list()

	    with gr.Blocks(title="Advanced Multi-Character TTS", css=css) as app:
	        gr.Markdown("## 🎙️ Advanced TTS with Multi-Character Dialogue & Subtitles")

	        with gr.Tabs():
	            with gr.TabItem("Standard Mode", elem_classes="tab"):
	                with gr.Row():
	                    with gr.Column():
	                        # NOTE(review): this toggle is not wired to any handler.
	                        phonemization_toggle = gr.Checkbox(
	                            label="Enable Advanced Phonemization",
	                            value=False,
	                            info="Improve pronunciation but may affect performance"
	                        )
	                        text_input = gr.Textbox(
	                            label="Input Text",
	                            value="Contact us at info@example.com or call 012-345-6789. Our website is https://www.example.com",
	                            lines=7
	                        )

	                        with gr.Accordion("Voice Settings", open=True):
	                            voice = gr.Dropdown(
	                                label="Select Voice",
	                                choices=voice_choices,
	                                value=voice_choices[0] if voice_choices else None
	                            )
	                            with gr.Row():
	                                speed = gr.Slider(
	                                    label="Speed",
	                                    minimum=0.7,
	                                    maximum=1.3,
	                                    value=1.0,
	                                    step=0.05
	                                )
	                                volume = gr.Slider(
	                                    label="Volume",
	                                    minimum=0.5,
	                                    maximum=2.0,
	                                    value=2.0,
	                                    step=0.1
	                                )
	                                pitch = gr.Slider(
	                                    label="Pitch",
	                                    minimum=0.8,
	                                    maximum=1.2,
	                                    value=1.0,
	                                    step=0.05
	                                )
	                            device = gr.Radio(
	                                label="Processing Device",
	                                choices=["GPU 🚀" if CUDA_AVAILABLE else "GPU (Not Available)", "CPU"],
	                                value="GPU 🚀" if CUDA_AVAILABLE else "CPU"
	                            )

	                        with gr.Accordion("Pause Settings (ms)", open=False):
	                            with gr.Row():
	                                default_pause = gr.Slider(0, 2000, 200, label="Default")
	                                dot_pause = gr.Slider(0, 3000, 600, label="Period (.)")
	                                ques_pause = gr.Slider(0, 3000, 800, label="Question (?)")
	                            with gr.Row():
	                                comma_pause = gr.Slider(0, 1500, 300, label="Comma (,)")
	                                colon_pause = gr.Slider(0, 2000, 400, label="Colon (:)")

	                        generate_btn = gr.Button("Generate Speech", variant="primary")

	                    with gr.Column():
	                        audio_output = gr.Audio(label="Output Audio", elem_classes="audio-output")
	                        stats_output = gr.Textbox(label="Processing Stats", lines=4)
	                        subtitle_output = gr.Textbox(label="Subtitles (.srt format)", lines=10, elem_classes="subtitle-output")
	                        download_btn = gr.Button("Download SRT File", elem_classes="download-btn")
	                        gr.Examples(
	                            examples=[
	                                ["Call 123-456-7890 for support"],
	                                ["Email me at john.doe@company.com"],
	                                ["Visit https://example.org for more info"],
	                                ["The price is $1,234.56"]
	                            ],
	                            inputs=text_input,
	                            label="Special Format Examples"
	                        )

	        generator = TTSGenerator()

	        def generate(text, voice, speed, volume, pitch, device, default_pause, dot_pause, ques_pause, comma_pause, colon_pause):
	            """Run synthesis and return (audio path, stats, subtitles, SRT path)."""
	            device = "cuda" if "GPU" in device and CUDA_AVAILABLE else "cpu"

	            pause_settings = {
	                'default_pause': default_pause,
	                'dot_pause': dot_pause,
	                'ques_pause': ques_pause,
	                'comma_pause': comma_pause,
	                'colon_pause': colon_pause,
	                'excl_pause': dot_pause,
	                'semi_pause': colon_pause,
	                'dash_pause': comma_pause,
	                'time_colon_pause': 0
	            }

	            result, stats, subtitles = generator.generate_story_audio(
	                text, voice, speed, device, pause_settings, volume, pitch
	            )

	            if not result:
	                return None, stats, "", None

	            _sample_rate, audio_data = result

	            # Unique files per request. Fixed paths under /tmp were shared by
	            # all users, so concurrent requests overwrote each other's output.
	            # The files are deliberately kept (delete=False) so Gradio can
	            # serve them after this function returns.
	            with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as f:
	                f.write(audio_data.tobytes())
	                filepath = f.name

	            # Explicit UTF-8 so non-ASCII subtitles do not depend on the locale.
	            with tempfile.NamedTemporaryFile("w", suffix=".srt", delete=False, encoding="utf-8") as f:
	                f.write(subtitles)
	                srt_path = f.name

	            return filepath, stats, subtitles, srt_path

	        # Holds the path of the most recently generated SRT file.
	        srt_file = gr.State()

	        generate_btn.click(
	            fn=generate,
	            inputs=[text_input, voice, speed, volume, pitch, device, default_pause, dot_pause, ques_pause, comma_pause, colon_pause],
	            outputs=[audio_output, stats_output, subtitle_output, srt_file]
	        )

	        # The download button exposes the stored SRT path as a file component.
	        download_btn.click(
	            fn=lambda srt_path: srt_path if srt_path else None,
	            inputs=[srt_file],
	            outputs=gr.File(label="Download SRT File")
	        )

	    return app

	if __name__ == "__main__":
	    # Build the UI and serve it on port 7860, listening on all interfaces.
	    app = create_interface()
	    app.launch(server_port=7860, server_name="0.0.0.0")