Spaces:

Shirochi
/

Glossarion

Running

App Files Files Community

Glossarion / discord_bot.py

Shirochi

Upload 93 files

ec038f4 verified about 2 months ago

raw

history blame contribute delete

128 kB

	#!/usr/bin/env python3
	"""
	Glossarion Discord Bot
	Translate files via Discord using your existing Glossarion installation

	PDF Formatting Integration:
	- When processing PDF files, the bot automatically uses the pdf_extractor module
	- The pdf_extractor.generate_css_from_pdf() function detects and extracts:
	* base_font_size: The median font size from the PDF body text
	* font_family: The most common font family (mapped to web-safe fonts)
	* text_align: The predominant text alignment (left, center, right, justify)
	* line_height_ratio: The calculated line spacing ratio
	- These variables are automatically applied during PDF -> HTML conversion
	- No manual configuration needed - styling is preserved from the original PDF
	"""

	import discord
	from discord import app_commands
	from discord.ext import commands
	import os
	import sys
	import asyncio
	import tempfile
	import shutil
	import json
	import logging
	import time
	import uuid
	import functools
	import base64
	import hashlib
	from urllib.parse import quote as urlquote
	from typing import Optional

	import requests
	from aiohttp import web
	from cryptography.fernet import Fernet

	# Make the Glossarion sources importable.
	# `discord_bot.py` normally sits directly inside `src/`. Legacy deployments use a
	# nested `src/src` layout, recognised by a config.json inside the nested folder.
	_base_dir = os.path.dirname(__file__)
	_nested_src_dir = os.path.join(_base_dir, "src")

	src_dir = (
	    _nested_src_dir
	    if os.path.isdir(_nested_src_dir) and os.path.exists(os.path.join(_nested_src_dir, "config.json"))
	    else _base_dir
	)

	sys.path.insert(0, src_dir)

	# Directories derived from the source location.
	PROJECT_ROOT = os.path.dirname(src_dir)
	HOSTED_FILES_DIR = os.path.join(PROJECT_ROOT, "hosted_files")
	USER_CONFIG_DIR = os.path.join(PROJECT_ROOT, "bot_user_configs")

	# Limits for the built-in file host and for direct Discord uploads.
	HOSTED_TTL_SECONDS = 24 * 60 * 60  # 24 hours
	HOSTED_MAX_BYTES = 5 * 1024 * 1024 * 1024  # 5 GB
	MAX_DISCORD_UPLOAD = 10 * 1024 * 1024  # 10 MB

	# Environment-driven settings.
	FILE_HOST_PORT = int(os.getenv("FILE_HOST_PORT", "8080"))
	FILE_HOST_BASE_URL = (os.getenv("FILE_HOST_BASE_URL") or f"http://localhost:{FILE_HOST_PORT}").rstrip("/")
	GOFILE_TOKEN = os.getenv("GOFILE_TOKEN")
	ORACLE_PAR_BASE = os.getenv("ORACLE_PAR_BASE", "")  # PAR base ending with /o/

	# Lazily-created aiohttp file host (populated by _ensure_file_host_server).
	_file_host_runner: Optional[web.AppRunner] = None
	_file_host_site: Optional[web.TCPSite] = None
	_file_host_started = False


	def _safe_filename(name: str) -> str:
	    """Reduce *name* to a basename made only of ASCII letters, digits, '-', '_' and '.'.

	    Directory components are dropped and every other character is replaced by
	    '_'. A falsy *name*, or one whose basename is empty, yields "file".
	    """
	    allowed = frozenset("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_.")
	    base = os.path.basename(name or "file")
	    sanitized = "".join(map(lambda c: c if c in allowed else "_", base))
	    if not sanitized:
	        return "file"
	    return sanitized


	def _cleanup_hosted_files() -> int:
	    """Prune the hosted-files directory and return the bytes still accounted for.

	    Creates HOSTED_FILES_DIR if needed, then:

	    1. deletes regular files that are empty or older than HOSTED_TTL_SECONDS;
	    2. if the remaining files still exceed HOSTED_MAX_BYTES, deletes the oldest
	       (by mtime) until the total fits.

	    Entries that cannot be inspected or removed are skipped, so a single
	    unreadable entry never aborts the sweep. Non-regular entries
	    (sub-directories etc.) are ignored and not counted.

	    Returns:
	        Total size in bytes of the regular files that were kept.
	    """
	    os.makedirs(HOSTED_FILES_DIR, exist_ok=True)
	    now = time.time()
	    kept = []  # (mtime, size, path)
	    total = 0
	    for fname in os.listdir(HOSTED_FILES_DIR):
	        path = os.path.join(HOSTED_FILES_DIR, fname)
	        try:
	            st = os.stat(path)
	        except OSError:
	            # Vanished, broken symlink, permission problem, ... - skip it, the
	            # same way _ensure_space does.
	            continue
	        if not os.path.isfile(path):
	            continue
	        # Drop empty and expired files proactively.
	        if st.st_size <= 0 or now - st.st_mtime > HOSTED_TTL_SECONDS:
	            try:
	                os.remove(path)
	            except OSError:
	                pass
	            continue
	        total += st.st_size
	        kept.append((st.st_mtime, st.st_size, path))

	    # Enforce the quota by deleting the oldest files first.
	    if total > HOSTED_MAX_BYTES:
	        kept.sort(key=lambda t: t[0])
	        for _mtime, size, path in kept:
	            if total <= HOSTED_MAX_BYTES:
	                break
	            try:
	                os.remove(path)
	            except OSError:
	                continue
	            total -= size
	    return total


	def _hosted_download_url(stored_name: str) -> str:
	    """Build the download URL for a file kept in the hosted-files directory.

	    The name is percent-encoded and appended to FILE_HOST_BASE_URL under /files/.
	    """
	    encoded_name = urlquote(stored_name)
	    return "/".join((FILE_HOST_BASE_URL, "files", encoded_name))


	def _ensure_space(effective_bytes: int) -> None:
	    """Guarantee room for *effective_bytes* in hosted storage, evicting old files if needed.

	    Runs the regular cleanup first. If the request still does not fit, the
	    oldest regular files (by mtime) are deleted until it does.

	    Raises:
	        ValueError: the request alone exceeds HOSTED_MAX_BYTES, or not enough
	            files could be removed to make room.
	    """
	    used = _cleanup_hosted_files()
	    if effective_bytes > HOSTED_MAX_BYTES:
	        raise ValueError("File exceeds 5GB host capacity")

	    if used + effective_bytes > HOSTED_MAX_BYTES:
	        # Regular cleanup was not enough: collect what is left, oldest first.
	        candidates = []
	        for entry in list(os.listdir(HOSTED_FILES_DIR)):
	            full = os.path.join(HOSTED_FILES_DIR, entry)
	            try:
	                info = os.stat(full)
	            except Exception:
	                continue
	            if os.path.isfile(full):
	                candidates.append((info.st_mtime, info.st_size, full))
	        candidates.sort(key=lambda item: item[0])

	        for _mtime, nbytes, full in candidates:
	            if used + effective_bytes <= HOSTED_MAX_BYTES:
	                break
	            try:
	                os.remove(full)
	            except Exception:
	                continue
	            used -= nbytes

	        if used + effective_bytes > HOSTED_MAX_BYTES:
	            raise ValueError("Insufficient space in hosted storage (5GB cap)")


	def _store_hosted_file(file_path: str, display_name: str, *, send_zip: bool) -> str:
	    """Copy *file_path* into hosted storage under a unique name and return that name.

	    Space is reserved for twice the file size when *send_zip* is true. The
	    stored name is "<unix time>_<8 hex chars>_<sanitised display name>".
	    Errors raised by _ensure_space (ValueError) propagate to the caller.
	    """
	    multiplier = 2 if send_zip else 1
	    _ensure_space(os.path.getsize(file_path) * multiplier)

	    cleaned = _safe_filename(display_name)
	    timestamp = int(time.time())
	    token = uuid.uuid4().hex[:8]
	    stored_name = "_".join((str(timestamp), token, cleaned))
	    shutil.copy2(file_path, os.path.join(HOSTED_FILES_DIR, stored_name))
	    return stored_name


	async def _ensure_file_host_server():
	    """Start the built-in aiohttp file host once; later calls return immediately.

	    Serves GET /files/{name} from HOSTED_FILES_DIR on 0.0.0.0:FILE_HOST_PORT.

	    If the listener cannot be started (for example the port is already in use)
	    the runner that was set up is cleaned up again and the error propagates.
	    The module globals are only updated after a successful start, so a later
	    call can retry from a clean state.
	    """
	    global _file_host_runner, _file_host_site, _file_host_started
	    if _file_host_started:
	        return

	    async def serve_file(request: web.Request):
	        fname = request.match_info.get("name", "")
	        # Prevent path traversal: only names that survive sanitising unchanged
	        # are ever looked up on disk.
	        safe = _safe_filename(fname)
	        if safe != fname:
	            raise web.HTTPNotFound()
	        path = os.path.join(HOSTED_FILES_DIR, fname)
	        if not os.path.isfile(path):
	            raise web.HTTPNotFound()
	        return web.FileResponse(path)

	    os.makedirs(HOSTED_FILES_DIR, exist_ok=True)
	    app = web.Application()
	    app.add_routes([web.get('/files/{name}', serve_file)])

	    runner = web.AppRunner(app)
	    await runner.setup()
	    try:
	        site = web.TCPSite(runner, host='0.0.0.0', port=FILE_HOST_PORT)
	        await site.start()
	    except BaseException:
	        # Do not leak a set-up runner when binding fails or the task is cancelled.
	        await runner.cleanup()
	        raise

	    _file_host_runner = runner
	    _file_host_site = site
	    _file_host_started = True
	    sys.stderr.write(f"[FILE HOST] Serving {HOSTED_FILES_DIR} at {FILE_HOST_BASE_URL}/files/<name>\n")
	    sys.stderr.flush()


	def _effective_discord_size(bytes_len: int, send_zip: bool) -> int:
	    """Return the size to budget for an upload: doubled when *send_zip* is true."""
	    if send_zip:
	        return int(bytes_len * 2)
	    return int(bytes_len * 1)

	def _should_offload(bytes_len: int, send_zip: bool) -> bool:
	    """Tell whether the budgeted upload size exceeds MAX_DISCORD_UPLOAD."""
	    budget = _effective_discord_size(bytes_len, send_zip)
	    return budget > MAX_DISCORD_UPLOAD


	def _offload_path_blocking(file_path: str, display_name: str, *, send_zip: bool) -> str:
	    """Copy the file into hosted storage and return its download URL.

	    Performs the copy synchronously on the calling thread.
	    """
	    return _hosted_download_url(_store_hosted_file(file_path, display_name, send_zip=send_zip))


	def _upload_to_oracle_par(path: str, display_name: Optional[str]) -> str:
	    """Upload *path* with an HTTP PUT below ORACLE_PAR_BASE and return the object URL.

	    The object URL is ORACLE_PAR_BASE (normalised to end with exactly one '/')
	    followed by the percent-encoded *display_name*, or the file's basename
	    when no display name is given.

	    Raises:
	        RuntimeError: ORACLE_PAR_BASE is not set, or the server answered with
	            a status other than 200, 201 or 204.
	    """
	    if not ORACLE_PAR_BASE:
	        raise RuntimeError("ORACLE_PAR_BASE not set")
	    fname = display_name or os.path.basename(path)
	    # urlquote is the same urllib quote() that requests.utils re-exports.
	    url = ORACLE_PAR_BASE.rstrip('/') + '/' + urlquote(fname)
	    with open(path, "rb") as f:
	        # Passing the file object lets requests stream the body from disk.
	        resp = requests.put(url, data=f, headers={"Content-Type": "application/octet-stream"}, timeout=180)
	    if resp.status_code not in (200, 201, 204):
	        raise RuntimeError(f"Oracle upload failed HTTP {resp.status_code}: {resp.text[:200]}")
	    return url


	def _upload_to_tmpfiles(path: str, display_name: Optional[str]) -> str:
	    """Upload *path* to tmpfiles.org and return the link from the response.

	    The link is read from the JSON field data.url. If that is missing, a
	    plain-text body starting with "http" is accepted instead.

	    Raises:
	        RuntimeError: the HTTP status is not 200, or no link could be found.
	    """
	    fname = display_name or os.path.basename(path)
	    with open(path, "rb") as f:
	        files = {"file": (fname, f, "application/octet-stream")}
	        resp = requests.post("https://tmpfiles.org/api/v1/upload", files=files, timeout=60)
	    if resp.status_code != 200:
	        raise RuntimeError(f"tmpfiles HTTP {resp.status_code}")

	    try:
	        data = resp.json()
	    except ValueError:
	        data = None
	    # The body may be valid JSON without being an object (list, string, ...);
	    # only dig into it when the shape is what we expect.
	    payload = data.get("data") if isinstance(data, dict) else None
	    link = payload.get("url") if isinstance(payload, dict) else None

	    if not link:
	        text = resp.text.strip()
	        if text.startswith("http"):
	            link = text
	    if not link:
	        raise RuntimeError(f"tmpfiles response invalid: {resp.text[:200]}")
	    return link


	def _upload_to_tempsh(path: str, display_name: Optional[str]) -> str:
	    """Upload *path* to temp.sh and return the link from the plain-text response.

	    Raises:
	        RuntimeError: the HTTP status is not 200, or the body does not start
	            with "http".
	    """
	    fname = display_name or os.path.basename(path)
	    with open(path, "rb") as f:
	        files = {"file": (fname, f, "application/octet-stream")}
	        resp = requests.post("https://temp.sh/upload", files=files, timeout=60)
	    if resp.status_code != 200:
	        raise RuntimeError(f"temp.sh HTTP {resp.status_code}")
	    link = resp.text.strip()
	    if not link.startswith("http"):
	        raise RuntimeError(f"temp.sh response invalid: {link[:200]}")
	    return link


	def _upload_to_gofile(path: str, display_name: Optional[str]) -> str:
	    """Upload file to Gofile and return a direct link.

	    First asks the Gofile API for an upload server, then posts the file to it.
	    GOFILE_TOKEN, when set, is sent as a Bearer token. The returned link is
	    data.directLink, falling back to data.downloadPage.

	    Raises:
	        RuntimeError: no server could be obtained, the upload was rejected, or
	            the response carried no link. Responses that are not JSON objects
	            are reported this way too instead of leaking a decode error.
	    """

	    def _json_object(resp) -> dict:
	        """Return the response body as a dict, or {} if it is not a JSON object."""
	        try:
	            parsed = resp.json()
	        except ValueError:
	            return {}
	        return parsed if isinstance(parsed, dict) else {}

	    def _data_section(body: dict) -> dict:
	        """Return body["data"] when it is a dict, else {}."""
	        section = body.get("data")
	        return section if isinstance(section, dict) else {}

	    server_resp = requests.get("https://api.gofile.io/getServer", timeout=15)
	    server = _data_section(_json_object(server_resp)).get("server")
	    if not server:
	        raise RuntimeError("Failed to get Gofile server")

	    name = display_name or os.path.basename(path)
	    headers = {"Authorization": f"Bearer {GOFILE_TOKEN}"} if GOFILE_TOKEN else {}
	    with open(path, "rb") as f:
	        files = {"file": (name, f, "application/octet-stream")}
	        upload_resp = requests.post(
	            f"https://{server}.gofile.io/uploadFile",
	            files=files,
	            headers=headers,
	            timeout=300,
	        )

	    data = _json_object(upload_resp)
	    if upload_resp.status_code != 200 or data.get("status") != "ok":
	        # Fall back to status + raw text when there is no JSON object to show.
	        detail = data or f"HTTP {upload_resp.status_code}: {upload_resp.text[:200]}"
	        raise RuntimeError(f"Gofile upload failed: {detail}")

	    result = _data_section(data)
	    link = result.get("directLink") or result.get("downloadPage")
	    if not link:
	        raise RuntimeError("Gofile response missing link")
	    return link


	def _pick_bot_tmpdir() -> str:
	    """Pick a temp directory that exists and is writable.

	    Some hosts run with TMPDIR/TEMP pointing at a directory that can disappear
	    (e.g. cleaned up between runs). tempfile.mkdtemp() will then raise
	    FileNotFoundError: [Errno 2] No such file or directory.

	    We prefer a stable project-local directory to avoid that class of failure.

	    Candidates are tried in this order: GLOSSARION_BOT_TMPDIR, <project>/bot_tmp,
	    TMPDIR/TEMP/TMP, /tmp, /var/tmp and finally the current working directory.

	    Returns:
	        The absolute path of the first candidate that can be created and is
	        writable, or "" when none qualifies. The path is made absolute so it
	        keeps pointing at the same directory after the process changes its
	        working directory.
	    """
	    candidates = []

	    # User override
	    override = (os.getenv("GLOSSARION_BOT_TMPDIR") or "").strip()
	    if override:
	        candidates.append(override)

	    # Project-local temp dir (most stable)
	    try:
	        project_root = os.path.dirname(src_dir)
	        candidates.append(os.path.join(project_root, "bot_tmp"))
	    except Exception:
	        pass

	    # System temp fallbacks
	    for k in ("TMPDIR", "TEMP", "TMP"):
	        v = (os.getenv(k) or "").strip()
	        if v:
	            candidates.append(v)

	    # Common unix temp dirs
	    candidates.extend(["/tmp", "/var/tmp"])

	    # Last resort: current working directory
	    try:
	        candidates.append(os.getcwd())
	    except Exception:
	        pass

	    for d in candidates:
	        try:
	            # abspath() consults the CWD for relative candidates and can fail
	            # when the CWD is gone, hence it lives inside the try.
	            d = os.path.abspath(d)
	            os.makedirs(d, exist_ok=True)
	            if os.path.isdir(d) and os.access(d, os.W_OK):
	                return d
	        except Exception:
	            continue

	    # If everything fails, let tempfile decide (may still error, but nothing else we can do here)
	    return ""


	# Temp root chosen once at import time; "" means no usable directory was found.
	BOT_TMPDIR = _pick_bot_tmpdir()
	if BOT_TMPDIR:
	    sys.stderr.write(f"[CONFIG] Bot temp dir: {BOT_TMPDIR}\n")
	    sys.stderr.flush()

	    # Ensure all stdlib tempfile users (and many third-party libs) use the stable temp root.
	    # Only done when a directory was actually found: tempfile treats any non-None
	    # value as authoritative, so assigning "" would make it create files relative
	    # to the current directory instead of running its own discovery.
	    tempfile.tempdir = BOT_TMPDIR

	def _ensure_stable_cwd() -> None:
	    """Repair the working directory and temp settings if they have gone stale.

	    Hosts may clean up the directory TMPDIR points to, and the process CWD can
	    vanish too if something chdir()'d into a temp dir that was later removed.
	    Unrelated code then fails with:
	    FileNotFoundError: [Errno 2] No such file or directory

	    Recovery steps:
	    - chdir() to the project root when the CWD no longer exists
	    - chdir() to the project root when the CWD lies inside BOT_TMPDIR
	    - re-create BOT_TMPDIR and point TMPDIR + tempfile.tempdir at it again

	    Every step is best effort; failures are swallowed.
	    """
	    project_root = os.path.dirname(src_dir)

	    def _is_within(child: str, parent: str) -> bool:
	        # True when *child* equals *parent* or lies below it; False on any error.
	        try:
	            parent_abs = os.path.abspath(parent)
	            return os.path.commonpath([os.path.abspath(child), parent_abs]) == parent_abs
	        except Exception:
	            return False

	    # Step 1: make sure the process has a working directory at all.
	    try:
	        cwd = os.getcwd()
	    except FileNotFoundError:
	        cwd = ""
	        try:
	            os.chdir(project_root)
	            cwd = os.getcwd()
	        except Exception:
	            cwd = ""

	    # Step 2: even a valid CWD must not sit inside the temp root
	    # (process-wide chdir() is a footgun).
	    try:
	        running_in_tmp = bool(cwd) and bool(BOT_TMPDIR) and _is_within(cwd, BOT_TMPDIR)
	        if running_in_tmp:
	            os.chdir(project_root)
	    except Exception:
	        pass

	    # Step 3: re-assert the stable temp dir (helps libraries that call
	    # tempfile.gettempdir()).
	    if BOT_TMPDIR:
	        try:
	            os.makedirs(BOT_TMPDIR, exist_ok=True)
	            os.environ['TMPDIR'] = BOT_TMPDIR
	            tempfile.tempdir = BOT_TMPDIR
	        except Exception:
	            pass


	# Ensure our process isn't running with a deleted working directory at startup.
	_ensure_stable_cwd()

	# Import Glossarion modules
	# The whole group is imported inside one try block: if any non-optional module
	# raises ImportError, GLOSSARION_AVAILABLE is set to False and a pass-through
	# decrypt_config is defined instead. Modules wrapped in their own inner
	# try/except are optional; their name is bound to None when missing.
	try:
	    # Core translation modules
	    import TransateKRtoEN
	    import extract_glossary_from_epub
	    import extract_glossary_from_txt
	    from model_options import get_model_options
	    from api_key_encryption import decrypt_config

	    # File processing modules
	    import pdf_extractor
	    import epub_converter
	    import enhanced_text_extractor
	    import txt_processor

	    # Glossary management
	    import GlossaryManager
	    import glossary_compressor

	    # Chapter and text processing
	    import chapter_splitter
	    import Chapter_Extractor
	    import chapter_extraction_manager

	    # API and client modules
	    import unified_api_client
	    try:
	        import async_api_processor
	    except ImportError:
	        async_api_processor = None
	    import multi_api_key_manager

	    # Utility modules
	    import history_manager
	    try:
	        import metadata_batch_translator
	    except ImportError:
	        metadata_batch_translator = None
	    import google_free_translate

	    # Duplicate detection
	    import advanced_duplicate_detection
	    import duplicate_detection_config

	    # Image translation (may not be used in Discord but import for completeness)
	    try:
	        import image_translator
	    except ImportError:
	        image_translator = None
	    try:
	        import manga_translator
	    except ImportError:
	        manga_translator = None
	    try:
	        import manga_integration
	    except ImportError:
	        manga_integration = None

	    # Don't import GUI modules - they require Qt/PySide6
	    # (translator_gui, GlossaryManager_GUI, QA_Scanner_GUI, etc.)

	    GLOSSARION_AVAILABLE = True
	    # Entry point of the EPUB glossary extractor, kept under a module-level alias.
	    glossary_main = extract_glossary_from_epub.main
	except ImportError as e:
	    GLOSSARION_AVAILABLE = False
	    glossary_main = None
	    print(f"⚠️ Glossarion modules not available: {e}")
	    # Fallback so load_config() can still call decrypt_config: returns the
	    # config unchanged.
	    def decrypt_config(c):
	        return c

	# Primary config location: next to the Glossarion sources.
	CONFIG_FILE = os.path.join(src_dir, "config.json")

	# Built-in prompt profile names, used when config.json cannot be read or has
	# no prompt_profiles. "Universal" stays first for clarity.
	DEFAULT_PROMPT_PROFILES = [
	    "Universal",
	    "korean_TXT", "japanese_TXT", "chinese_TXT",
	    "korean_OCR", "japanese_OCR", "chinese_OCR",
	    "Manga_KR", "Manga_JP", "Manga_CN",
	    "korean", "japanese", "chinese",
	    "Original",
	    "korean2",
	    "Manga_JP_1",
	    "nano banna",
	    "test",
	    "refinement",
	]

	# Bot setup: default intents plus message content, "/" as the text prefix.
	intents = discord.Intents.default()
	intents.message_content = True
	bot = commands.Bot(
	    command_prefix="/",
	    intents=intents,
	)


	class _SuppressExpectedAutocompleteErrors(logging.Filter):
	    """Drop log records for autocomplete failures that are expected and harmless.

	    Autocomplete interactions are short-lived and often cancelled or expired
	    while the user is still typing. Answering them can then raise:
	    - 10062 Unknown interaction
	    - 40060 Interaction has already been acknowledged

	    Nothing can be done about either, so they would only spam the logs.
	    """

	    def filter(self, record: logging.LogRecord) -> bool:
	        """Return False only for the two expected autocomplete errors, True otherwise."""
	        try:
	            from_tree = record.name == "discord.app_commands.tree"
	            # Only the specific "Ignoring exception in autocomplete" lines are candidates.
	            if not from_tree or "Ignoring exception in autocomplete" not in (record.getMessage() or ""):
	                return True

	            exc_info = record.exc_info
	            exc = exc_info[1] if exc_info and len(exc_info) >= 2 else None
	            code = getattr(exc, "code", None)

	            unknown_interaction = isinstance(exc, discord.NotFound) and code == 10062
	            already_acknowledged = isinstance(exc, discord.HTTPException) and code == 40060
	            return not (unknown_interaction or already_acknowledged)
	        except Exception:
	            # Never break logging.
	            return True


	# Attach the filter at import time so it is active before CommandTree logs anything.
	_tree_logger = logging.getLogger("discord.app_commands.tree")
	_tree_logger.addFilter(_SuppressExpectedAutocompleteErrors())

	# Global storage for translation state (LogView looks entries up by user id).
	translation_states = dict()

	# ---- Per-user config helpers ----
	def _user_config_path(user_id: int) -> str:
	    """Return the path of the JSON settings file for *user_id* inside USER_CONFIG_DIR."""
	    filename = "{}.json".format(user_id)
	    return os.path.join(USER_CONFIG_DIR, filename)


	def load_user_config(user_id: int) -> dict:
	    """Load the stored settings of *user_id*.

	    Returns:
	        The parsed JSON object, or {} when the file is missing, unreadable,
	        not valid JSON, or its top-level value is not an object. Callers use
	        .get() and .update() on the result, so anything but a dict would
	        break them.
	    """
	    try:
	        with open(_user_config_path(user_id), "r", encoding="utf-8") as f:
	            data = json.load(f)
	    except Exception:
	        # Deliberately best effort: a missing or damaged file means "no settings".
	        return {}
	    return data if isinstance(data, dict) else {}


	def save_user_config(user_id: int, payload: dict) -> None:
	    """Merge *payload* into the stored settings of *user_id* and write them to disk.

	    The file is written to a temporary sibling first and then moved into place
	    with os.replace(), so an interrupted write cannot leave a truncated file
	    behind (which would later load as an empty config).

	    Failures are logged to stderr and not raised.
	    """
	    try:
	        os.makedirs(USER_CONFIG_DIR, exist_ok=True)
	        cfg = load_user_config(user_id)
	        if not isinstance(cfg, dict):
	            # A damaged file must not block saving fresh settings.
	            cfg = {}
	        cfg.update(payload)

	        target = _user_config_path(user_id)
	        tmp_path = f"{target}.{uuid.uuid4().hex}.tmp"
	        try:
	            with open(tmp_path, "w", encoding="utf-8") as f:
	                json.dump(cfg, f, ensure_ascii=False, indent=2)
	            os.replace(tmp_path, target)
	        except BaseException:
	            # Do not leave the temporary file behind on any failure.
	            try:
	                os.remove(tmp_path)
	            except OSError:
	                pass
	            raise
	    except Exception as e:
	        sys.stderr.write(f"[CONFIG] Failed to save user config for {user_id}: {e}\n")
	        sys.stderr.flush()

	def _derive_user_cipher(user_id: int, passphrase: Optional[str], salt: str) -> Fernet:
	    """Build the Fernet cipher for one user.

	    The key is the SHA-256 digest of "<secret>:<user_id>:<salt>", where the
	    secret is the stripped passphrase or, when none is given, the stripped
	    USER_CFG_MASTER_KEY environment variable.

	    NOTE(review): a single SHA-256 pass is a weak KDF for human passphrases.
	    Changing it would make existing ciphertexts undecryptable, so it is only
	    flagged here.

	    Raises:
	        ValueError: neither a passphrase nor USER_CFG_MASTER_KEY is available.
	    """
	    secret = passphrase or os.getenv("USER_CFG_MASTER_KEY") or ""
	    secret = secret.strip()
	    if not secret:
	        raise ValueError(
	            "No passphrase provided and USER_CFG_MASTER_KEY is not set. "
	            "Set a passphrase or configure USER_CFG_MASTER_KEY to unlock saved credentials."
	        )
	    parts = (
	        secret.encode("utf-8"),
	        str(user_id).encode("utf-8"),
	        (salt or "").encode("utf-8"),
	    )
	    digest = hashlib.sha256(b":".join(parts)).digest()
	    return Fernet(base64.urlsafe_b64encode(digest))


	def _encrypt_user_secret(user_id: int, payload: dict, passphrase: Optional[str]) -> dict:
	    """Encrypt *payload* for one user and return the storable blob.

	    A fresh random salt is generated per call. The blob holds the Fernet
	    token, the salt, whether a passphrase was supplied, and the creation time.
	    ValueError from key derivation propagates to the caller.
	    """
	    salt = base64.urlsafe_b64encode(os.urandom(16)).decode()
	    # Derive the cipher before serialising, so a missing key is reported first.
	    cipher = _derive_user_cipher(user_id, passphrase, salt)
	    plaintext = json.dumps(payload).encode("utf-8")
	    blob = dict(
	        ciphertext=cipher.encrypt(plaintext).decode(),
	        salt=salt,
	        uses_passphrase=bool(passphrase),
	        created_at=int(time.time()),
	    )
	    return blob


	def _decrypt_user_secret(user_id: int, blob: dict, passphrase: Optional[str]) -> dict:
	    """Decrypt a blob produced by _encrypt_user_secret.

	    Returns {} when *blob* is empty, not a dict, or has no ciphertext.
	    Errors from key derivation, decryption or JSON parsing propagate.
	    """
	    if not isinstance(blob, dict) or not blob:
	        return {}
	    token = blob.get("ciphertext")
	    if not token:
	        return {}
	    cipher = _derive_user_cipher(user_id, passphrase, blob.get("salt") or "")
	    plaintext = cipher.decrypt(token.encode("utf-8")).decode("utf-8")
	    return json.loads(plaintext)


	def _parse_multi_key_block(raw: Optional[str], model: Optional[str]) -> list:
	    """Turn a newline-separated block of API keys into multi_api_keys entries.

	    Blank lines are ignored and at most the first 50 keys are used. Every
	    entry gets the stripped *model* (or "gpt-4o" when that is empty) and is
	    marked enabled.
	    """
	    if not raw:
	        return []
	    stripped_lines = (line.strip() for line in raw.splitlines())
	    usable_keys = [key for key in stripped_lines if key][:50]
	    return [
	        {"api_key": key, "model": (model or "").strip() or "gpt-4o", "enabled": True}
	        for key in usable_keys
	    ]


	def load_saved_credentials(user_id: int, passphrase: Optional[str]) -> Optional[dict]:
	    """Return the decrypted saved credentials of *user_id*, or None.

	    None is returned when nothing is stored or decryption fails (the failure
	    is logged to stderr). ValueError is re-raised so a missing passphrase or
	    master key reaches the caller.
	    """
	    blob = load_user_config(user_id).get("credentials")
	    if not blob:
	        return None
	    try:
	        return _decrypt_user_secret(user_id, blob, passphrase)
	    except Exception as e:
	        if isinstance(e, ValueError):
	            # Bubble up missing passphrase/master key errors
	            raise
	        sys.stderr.write(f"[CONFIG] Failed to decrypt credentials for {user_id}: {e}\n")
	        sys.stderr.flush()
	        return None


	def _ephemeral(interaction: discord.Interaction) -> bool:
	    """Return True when the interaction has a guild, False otherwise (e.g. in DMs)."""
	    in_guild = interaction.guild is not None
	    return in_guild


	async def _safe_defer(interaction: discord.Interaction, *, ephemeral: bool) -> bool:
	    """Acknowledge a slash-command interaction as early as possible.

	    Discord expects a quick initial acknowledgement, otherwise the interaction
	    expires. After deferring, the original response can be edited safely.

	    Returns:
	        True when the interaction is acknowledged (now or earlier), False when
	        it is already gone (error code 10062, or 40060 on a non-NotFound
	        HTTPException). Any other HTTP error is re-raised.
	    """
	    try:
	        if not interaction.response.is_done():
	            await interaction.response.defer(ephemeral=ephemeral)
	        return True
	    except discord.HTTPException as e:
	        # NotFound is a subclass of HTTPException; for it only 10062 is ignored.
	        ignorable = (10062,) if isinstance(e, discord.NotFound) else (10062, 40060)
	        if getattr(e, "code", None) in ignorable:
	            return False
	        raise


	async def _safe_edit_original_response(
	    interaction: discord.Interaction,
	    *,
	    content: Optional[str] = None,
	    embed: Optional[discord.Embed] = None,
	    view: Optional[discord.ui.View] = None,
	):
	    """Edit the interaction's original response, tolerating an expired interaction.

	    content, embed and view are always forwarded, including when they are None.

	    Returns:
	        Whatever edit_original_response returns, or None when the edit failed
	        with code 10062 (or 40060 on a non-NotFound HTTPException). Any other
	        HTTP error is re-raised.
	    """
	    try:
	        edited = await interaction.edit_original_response(content=content, embed=embed, view=view)
	    except discord.HTTPException as e:
	        # NotFound is a subclass of HTTPException; for it only 10062 is ignored.
	        ignorable = (10062,) if isinstance(e, discord.NotFound) else (10062, 40060)
	        if getattr(e, "code", None) in ignorable:
	            return None
	        raise
	    return edited


	async def _safe_send_message(
	    interaction: discord.Interaction,
	    content: Optional[str] = None,
	    *,
	    embed: Optional[discord.Embed] = None,
	    ephemeral: bool = False,
	    **kwargs,
	):
	    """Send a message for an interaction without crashing on common interaction races.

	    Uses a followup when the interaction was already answered, otherwise the
	    initial response. Extra keyword arguments are passed through to the send call.

	    NOTE: discord.NotFound (10062) is a subclass of discord.HTTPException, so it
	    is told apart with isinstance() inside the single handler below.

	    Returns a discord.Message when possible, otherwise None.
	    """

	    async def _via_followup():
	        return await interaction.followup.send(
	            content=content,
	            embed=embed,
	            ephemeral=ephemeral,
	            wait=True,
	            **kwargs,
	        )

	    try:
	        if interaction.response.is_done():
	            return await _via_followup()

	        await interaction.response.send_message(
	            content=content,
	            embed=embed,
	            ephemeral=ephemeral,
	            **kwargs,
	        )
	        try:
	            return await interaction.original_response()
	        except Exception:
	            return None

	    except discord.HTTPException as e:
	        code = getattr(e, "code", None)

	        if isinstance(e, discord.NotFound):
	            # Interaction expired/cancelled (common under load).
	            if code == 10062:
	                return None
	            raise

	        # If the interaction was already acknowledged, fall back to followup.
	        if code == 40060:
	            try:
	                return await _via_followup()
	            except Exception:
	                return None

	        # Some platforms return 10062 as HTTPException; treat it as non-fatal.
	        if code == 10062:
	            return None

	        raise


	class LogView(discord.ui.View):
	    """View with buttons to toggle log display and stop translation.

	    Both buttons look up the session in the module-level translation_states
	    dict using the user id given at construction time.
	    """

	    def __init__(self, user_id: int):
	        super().__init__(timeout=None)  # No timeout for persistent view
	        self.user_id = user_id

	    async def _report_button_error(self, interaction: discord.Interaction, error: Exception) -> None:
	        """Log a button-callback failure and try to tell the user about it."""
	        sys.stderr.write(f"[BUTTON ERROR] {error}\n")
	        sys.stderr.flush()
	        try:
	            await _safe_send_message(interaction, f"❌ Error: {error}", ephemeral=_ephemeral(interaction))
	        except Exception:
	            # Best effort only. `except Exception` (not a bare except) so that
	            # task cancellation and interpreter exit are never swallowed.
	            pass

	    @discord.ui.button(label="Show More Logs", style=discord.ButtonStyle.secondary, emoji="🔽", custom_id="toggle_logs")
	    async def toggle_logs(self, interaction: discord.Interaction, button: discord.ui.Button):
	        """Toggle between compact and full log view"""
	        state = translation_states.get(self.user_id)
	        if not state:
	            await _safe_send_message(interaction, "❌ Translation session expired", ephemeral=_ephemeral(interaction))
	            return

	        try:
	            # Toggle the state
	            state['show_full'] = not state.get('show_full', False)

	            # Update button label
	            if state['show_full']:
	                button.label = "Show Less"
	                button.emoji = "🔼"
	            else:
	                button.label = "Show More Logs"
	                button.emoji = "🔽"

	            # Get log text based on current state; both variants are trimmed
	            # to their most recent characters.
	            logs = state.get('logs', [])
	            if state['show_full']:
	                log_text = '\n'.join(logs)
	                if len(log_text) > 3900:
	                    log_text = "..." + log_text[-3900:]
	            else:
	                log_text = '\n'.join(logs[-10:])
	                if len(log_text) > 800:
	                    log_text = log_text[-800:]

	            if not log_text:
	                log_text = "No logs yet..."

	            embed = discord.Embed(
	                title="📚 Translation in Progress",
	                description=f"Status: Processing... ({len(logs)} logs)\n\n```{log_text}```",
	                color=discord.Color.blue()
	            )

	            await interaction.response.edit_message(embed=embed, view=self)
	        except Exception as e:
	            await self._report_button_error(interaction, e)

	    @discord.ui.button(label="Stop Translation", style=discord.ButtonStyle.danger, emoji="⏹️", custom_id="stop_translation")
	    async def stop_translation(self, interaction: discord.Interaction, button: discord.ui.Button):
	        """Stop the translation process"""
	        state = translation_states.get(self.user_id)
	        if not state:
	            await _safe_send_message(interaction, "❌ Translation session expired", ephemeral=_ephemeral(interaction))
	            return

	        try:
	            # Only sets the flag; nothing in this class acts on it.
	            state['stop_requested'] = True
	            button.disabled = True
	            button.label = "Stopped"
	            button.style = discord.ButtonStyle.secondary

	            await interaction.response.edit_message(view=self)
	            await interaction.followup.send("⏹️ Translation stop requested...", ephemeral=_ephemeral(interaction))
	        except Exception as e:
	            await self._report_button_error(interaction, e)


	def load_config():
	    """Load Glossarion config (decrypted).

	    Tries CONFIG_FILE, then <PROJECT_ROOT>/config.json, then config.json in
	    the current working directory, and returns the first one that loads. The
	    path that was used is stored under the "_source_config" key.

	    Returns:
	        The decrypted config dict, or {} when no candidate could be loaded.
	        Load failures other than a missing file are logged to stderr.
	    """
	    search_paths = [
	        CONFIG_FILE,
	        os.path.join(PROJECT_ROOT, "config.json"),
	    ]
	    try:
	        search_paths.append(os.path.join(os.getcwd(), "config.json"))
	    except OSError:
	        # The working directory can be deleted underneath the process; the
	        # remaining candidates are still worth trying.
	        pass

	    for path in search_paths:
	        try:
	            with open(path, 'r', encoding='utf-8') as f:
	                config = json.load(f)
	            config = decrypt_config(config)
	            # Remember which config file we actually used (debugging aid)
	            config["_source_config"] = path
	            return config
	        except FileNotFoundError:
	            continue
	        except Exception as e:
	            sys.stderr.write(f"[CONFIG] Failed to load {path}: {e}\n")
	            sys.stderr.flush()

	    sys.stderr.write("[CONFIG] No config.json found in expected locations; using empty config\n")
	    sys.stderr.flush()
	    return {}


	@bot.event
	async def on_ready():
	    """Announce that the bot is online and sync the slash-command tree.

	    A sync failure is printed together with its traceback and not re-raised.
	    """
	    print(f"✅ {bot.user} is online!")
	    try:
	        synced_commands = await bot.tree.sync()
	        synced_count = len(synced_commands)
	        print(f"✅ Synced {synced_count} command(s)")
	    except Exception as e:
	        import traceback

	        print(f"❌ Failed to sync commands: {e}")
	        traceback.print_exc()


	async def model_autocomplete(interaction: discord.Interaction, current: str):
	    """Autocomplete for model selection - shows popular models from model_options.py.

	    With input, models containing *current* (case-insensitive) are offered.
	    Without input, the popular models that exist in model_options come first,
	    followed by the first 15 known models. Duplicates are removed so the same
	    model is never offered twice and does not use up a second slot.

	    If Glossarion is unavailable or model_options fails, a short hard-coded
	    list is returned; the failure is logged to stderr.
	    """
	    if GLOSSARION_AVAILABLE:
	        try:
	            all_models = list(get_model_options())
	            # Filter models that match current input
	            if current:
	                needle = current.lower()
	                matches = [m for m in all_models if needle in m.lower()]
	            else:
	                # Show popular models first when no input
	                popular = ['gpt-4', 'gpt-4-turbo', 'gpt-4o', 'claude-3-5-sonnet', 'claude-3-opus',
	                           'gemini-2.0-flash-exp', 'gemini-1.5-pro', 'deepseek-chat']
	                available = set(all_models)
	                matches = [m for m in popular if m in available] + all_models[:15]

	            # dict.fromkeys drops repeats while keeping first-seen order.
	            unique = list(dict.fromkeys(matches))

	            # Return up to 25 choices (Discord limit)
	            return [app_commands.Choice(name=m, value=m) for m in unique[:25]]
	        except Exception as e:
	            sys.stderr.write(f"[AUTO] model_autocomplete fallback due to error: {e}\n")
	            sys.stderr.flush()

	    # Fallback choices if model_options unavailable
	    return [
	        app_commands.Choice(name="gpt-4", value="gpt-4"),
	        app_commands.Choice(name="gpt-4-turbo", value="gpt-4-turbo"),
	        app_commands.Choice(name="claude-3-5-sonnet", value="claude-3-5-sonnet"),
	        app_commands.Choice(name="gemini-2.0-flash-exp", value="gemini-2.0-flash-exp"),
	    ]


	async def profile_autocomplete(interaction: discord.Interaction, current: str):
	    """Autocomplete prompt profile names taken from the config's prompt_profiles.

	    Configured profiles come first, followed by any built-in defaults that are
	    not configured. Without configured profiles only the defaults are used.
	    The list is filtered by *current* (case-insensitive) and capped at 25
	    choices. On any error a single "Universal" choice is returned.
	    """
	    try:
	        configured = load_config().get("prompt_profiles") or {}
	        profiles = list(configured.keys())

	        if profiles:
	            # Append the built-in defaults the config does not already define.
	            missing_defaults = [name for name in DEFAULT_PROMPT_PROFILES if name not in profiles]
	            profiles += missing_defaults
	        else:
	            # Fallback to hardcoded defaults if config has no profiles
	            profiles = list(DEFAULT_PROMPT_PROFILES)
	            sys.stderr.write("[CONFIG] prompt_profiles missing; using built-in defaults for autocomplete\n")
	            sys.stderr.flush()

	        if "Universal" not in profiles:
	            profiles.insert(0, "Universal")

	        if current:
	            needle = current.lower()
	            profiles = [p for p in profiles if needle in p.lower()]

	        choices = []
	        for profile_name in profiles[:25]:
	            choices.append(app_commands.Choice(name=profile_name, value=profile_name))
	        return choices
	    except Exception as e:
	        sys.stderr.write(f"[AUTO] profile_autocomplete fallback due to error: {e}\n")
	        sys.stderr.flush()
	        return [app_commands.Choice(name="Universal", value="Universal")]

	@bot.tree.command(name="save", description="Save your API settings (encrypted per user)")
	@app_commands.describe(
	    api_key="Primary API key to use by default",
	    model="Default model to use",
	    passphrase="Optional passphrase for encryption (else USER_CFG_MASTER_KEY is used)",
	    multi_key_mode="Enable multi-key rotation pool",
	    fallback_key="Enable fallback key list (uses the same multi keys)",
	    multi_keys="Up to 50 API keys, one per line (Multi key 1..50)"
	)
	async def save_cmd(
	    interaction: discord.Interaction,
	    api_key: str,
	    model: str,
	    passphrase: Optional[str] = None,
	    multi_key_mode: bool = False,
	    fallback_key: bool = False,
	    multi_keys: Optional[str] = None,
	):
	    """Persist encrypted API credentials for later /translate and /extract runs.

	    The reply is always ephemeral. Success is only reported after the stored
	    file has been read back and contains the new credentials, because
	    save_user_config() logs write failures instead of raising them.
	    """

	    if not await _safe_defer(interaction, ephemeral=True):
	        return

	    user_id = interaction.user.id
	    parsed_multi = _parse_multi_key_block(multi_keys, model)

	    # Multi-key and fallback modes only count when keys were actually supplied.
	    payload = {
	        "api_key": api_key.strip(),
	        "model": (model or "").strip(),
	        "use_multi_api_keys": bool(multi_key_mode and parsed_multi),
	        "multi_api_keys": parsed_multi,
	        "use_fallback_keys": bool(fallback_key and parsed_multi),
	        "fallback_keys": parsed_multi if fallback_key and parsed_multi else [],
	    }

	    try:
	        encrypted = _encrypt_user_secret(user_id, payload, passphrase)
	    except ValueError as e:
	        # Missing passphrase/master key: the message is already user-facing.
	        await _safe_edit_original_response(interaction, content=f"❌ {e}")
	        return
	    except Exception as e:
	        await _safe_edit_original_response(interaction, content=f"❌ Failed to save: {e}")
	        return

	    save_user_config(user_id, {"credentials": encrypted})

	    # Verify the write: never claim success for credentials that are not on disk.
	    stored_cfg = load_user_config(user_id)
	    stored = stored_cfg.get("credentials") if isinstance(stored_cfg, dict) else None
	    if stored != encrypted:
	        await _safe_edit_original_response(
	            interaction,
	            content="❌ Failed to save: your settings could not be written to disk.",
	        )
	        return

	    note = "Encrypted with passphrase" if passphrase else "Encrypted with USER_CFG_MASTER_KEY"
	    detail = "Multi-key rotation enabled" if payload["use_multi_api_keys"] else "Single key mode"
	    embed = discord.Embed(
	        title="✅ Saved credentials",
	        description=(
	            f"Model: `{payload['model'] or 'gpt-4o'}`\n"
	            f"Primary key stored.\n"
	            f"{detail}" + (f" ({len(parsed_multi)} keys)" if payload["use_multi_api_keys"] else "") + ".\n"
	            f"{note}."
	        ),
	        color=discord.Color.green(),
	    )
	    if payload["use_fallback_keys"]:
	        embed.add_field(name="Fallback keys", value=f"{len(parsed_multi)} configured", inline=False)

	    await _safe_edit_original_response(interaction, embed=embed)


	@bot.tree.command(name="translate", description="Translate EPUB, TXT, or PDF file")
	@app_commands.describe(
	file="EPUB, TXT, or PDF file to translate (optional if using url)",
	url="Google Drive or Dropbox link to file (optional if using file attachment)",
	custom_endpoint_url="Custom OpenAI-compatible base URL (auto-enables when set; omit to disable)",
	google_credentials_file="Google Cloud credentials JSON file upload (for Vertex AI models)",
	extraction_mode="Text extraction method (default: Enhanced/html2text)",
	temperature="Translation temperature 0.0-1.0 (default: 0.3)",
	batch_size="Paragraphs per batch (default: 10)",
	max_output_tokens="Max output tokens (default: 65536)",
	disable_smart_filter="Disable smart glossary filter (default: False)",
	duplicate_algorithm="Duplicate handling: auto/strict/balanced/aggressive/basic (default: balanced)",
	manual_glossary="Manual glossary file (.csv or .json) to upload and use instead of auto-generated",
	enable_auto_glossary="Enable automatic glossary generation (default: True)",
	request_merge_count="Chapters per request (set >=2 to enable request merging; <=1 disables; omit to disable)",
	split_the_merge="Split merged translation output back into separate files (default: True)",
	send_zip="Return output as a ZIP archive instead of individual file (default: False)",
	compression_factor="Compression factor (1.0-3.0; overrides auto-compression if set)",
	thinking="Enable/disable AI thinking capabilities (GPT/Gemini/DeepSeek) - Default: True",
	gemini_thinking_level="Gemini 3 thinking level (low/high) - Default: high",
	gemini_thinking_budget="Gemini thinking budget (-1=auto, 0=disabled) - Default: -1",
	gpt_effort="GPT-5/OpenAI thinking effort (none/low/medium/high/xhigh) - Default: medium",
	target_language="Target language",
	profile="Prompt profile from translator_gui (default: Universal)"
	)
	@app_commands.choices(extraction_mode=[
	app_commands.Choice(name="Enhanced (html2text)", value="enhanced"),
	app_commands.Choice(name="Standard (BeautifulSoup)", value="standard"),
	])
	@app_commands.choices(gemini_thinking_level=[
	app_commands.Choice(name="High", value="high"),
	app_commands.Choice(name="Low", value="low"),
	])
	@app_commands.choices(gpt_effort=[
	app_commands.Choice(name="None", value="none"),
	app_commands.Choice(name="Low", value="low"),
	app_commands.Choice(name="Medium", value="medium"),
	app_commands.Choice(name="High", value="high"),
	app_commands.Choice(name="XHigh", value="xhigh"),
	])
	@app_commands.autocomplete(model=model_autocomplete)
	@app_commands.autocomplete(profile=profile_autocomplete)
	async def translate(
	interaction: discord.Interaction,
	file: discord.Attachment = None,
	url: str = None,
	api_key: Optional[str] = None,
	passphrase: Optional[str] = None,
	model: Optional[str] = None,
	custom_endpoint_url: Optional[str] = None,
	google_credentials_file: discord.Attachment = None,
	extraction_mode: str = "enhanced",
	temperature: float = 0.3,
	batch_size: int = 10,
	max_output_tokens: int = 65536,
	disable_smart_filter: bool = False,
	duplicate_algorithm: str = "balanced",
	manual_glossary: discord.Attachment = None,
	enable_auto_glossary: bool = True,
	request_merge_count: Optional[int] = None,
	split_the_merge: bool = True,
	send_zip: bool = False,
	compression_factor: float = None,
	thinking: bool = True,
	gemini_thinking_level: str = "high",
	gemini_thinking_budget: int = -1,
	gpt_effort: str = "medium",
	target_language: str = "English",
	profile: str = "Universal"
	):
	"""Translate file using Glossarion"""

	# Acknowledge ASAP to avoid 10062 Unknown interaction under load.
	if not await _safe_defer(interaction, ephemeral=_ephemeral(interaction)):
	return

	_ensure_stable_cwd()

	if not GLOSSARION_AVAILABLE:
	await _safe_edit_original_response(interaction, content="❌ Glossarion not available")
	return

	# Validate input - must have either file or URL
	if not file and not url:
	await _safe_edit_original_response(interaction, content="❌ Please provide either a file attachment or a URL")
	return

	# Get filename and validate extension
	if file:
	filename = file.filename
	elif url:
	# Extract filename from URL or use default
	if 'drive.google.com' in url:
	filename = 'google_drive_file.epub' # Will be updated after download
	elif 'dropbox.com' in url:
	filename = 'dropbox_file.epub' # Will be updated after download
	else:
	# Try to get filename from URL path
	from urllib.parse import urlparse, unquote
	parsed = urlparse(url)
	filename = unquote(os.path.basename(parsed.path)) or 'downloaded_file.epub'

	# Never trust user/remote-provided names to be a safe path.
	# Keep /translate isolated from path traversal and accidental subdirectories.
	filename = os.path.basename(filename)

	# Validate file extension
	if not (filename.endswith('.epub') or filename.endswith('.txt') or filename.endswith('.pdf')):
	await _safe_edit_original_response(interaction, content="❌ File must be EPUB, TXT, or PDF format")
	return

	# Validate request merge count early (if explicitly provided)
	if request_merge_count is not None and request_merge_count < 0:
	await _safe_edit_original_response(interaction, content="❌ request_merge_count must be >= 0")
	return

	# Validate custom endpoint URL early (if provided)
	if custom_endpoint_url is not None:
	custom_endpoint_url = custom_endpoint_url.strip()
	if custom_endpoint_url and not (custom_endpoint_url.startswith('http://') or custom_endpoint_url.startswith('https://')):
	await _safe_edit_original_response(interaction, content="❌ custom_endpoint_url must start with http:// or https://")
	return

	user_id = interaction.user.id
	user_config = load_user_config(user_id)

	try:
	saved_creds = load_saved_credentials(user_id, passphrase)
	except ValueError as e:
	await _safe_edit_original_response(interaction, content=f"❌ {e}")
	return
	except Exception:
	saved_creds = None

	# Load config early so we can default the model without relying on autocomplete.
	config = load_config()

	# Default model: prefer explicit user input, otherwise config.json, then env var, then a safe fallback.
	if saved_creds and not model:
	model = (saved_creds.get('model') or '').strip()
	model = (model or '').strip() or (config.get('model') or '').strip() or (os.getenv('MODEL') or '').strip() or 'gpt-4o'


	if saved_creds and not api_key:
	api_key = saved_creds.get('api_key')
	api_key = (api_key or '').strip()
	if not api_key:
	await _safe_edit_original_response(interaction, content="❌ No API key available. Provide api_key or run /save first (with passphrase if set).")
	return

	use_multi_keys = bool(saved_creds and saved_creds.get("use_multi_api_keys") and saved_creds.get("multi_api_keys"))
	if use_multi_keys:
	os.environ['USE_MULTI_API_KEYS'] = '1'
	os.environ['USE_MULTI_KEYS'] = '1'
	try:
	from unified_api_client import UnifiedClient
	mk_list = saved_creds.get("multi_api_keys", [])
	UnifiedClient.set_in_memory_multi_keys(mk_list)
	except Exception:
	pass
	else:
	os.environ['USE_MULTI_API_KEYS'] = '0'
	os.environ['USE_MULTI_KEYS'] = '0'
	try:
	from unified_api_client import UnifiedClient
	UnifiedClient.clear_in_memory_multi_keys()
	except Exception:
	pass

	use_fallback_keys = bool(saved_creds and saved_creds.get("use_fallback_keys") and saved_creds.get("fallback_keys"))
	if use_fallback_keys:
	os.environ['USE_FALLBACK_KEYS'] = '1'
	os.environ['FALLBACK_KEYS'] = json.dumps(saved_creds.get("fallback_keys", []))
	else:
	os.environ['USE_FALLBACK_KEYS'] = '0'
	os.environ.pop('FALLBACK_KEYS', None)

	# Initial response (we already deferred; now edit the original response)
	profile_note = (
	f"Profile: {profile or 'Universal'}\n"
	"Note: target_lang replacement is skipped for profile prompts; choose the profile language you need.\n"
	"Profiles ending with _txt use html2text (default). Others use BeautifulSoup. 'ocr' profiles are for images."
	)
	embed = discord.Embed(
	title="📚 Translation Started",
	description=(
	f"File: {filename}\n"
	f"Model: {model}\n"
	f"Target: {target_language}\n\n"
	f"{profile_note}"
	),
	color=discord.Color.blue()
	)
	msg_obj = await _safe_edit_original_response(interaction, embed=embed)
	if msg_obj is None:
	return
	try:
	message = await interaction.original_response()
	except Exception:
	message = None
	if message is None:
	return
	# Persist user preferences for next runs
	try:
	save_user_config(user_id, {
	"translate": {
	"model": model,
	"custom_endpoint_url": custom_endpoint_url,
	"extraction_mode": extraction_mode,
	"temperature": temperature,
	"batch_size": batch_size,
	"max_output_tokens": max_output_tokens,
	"disable_smart_filter": disable_smart_filter,
	"duplicate_algorithm": duplicate_algorithm,
	"enable_auto_glossary": enable_auto_glossary,
	"request_merge_count": request_merge_count,
	"split_the_merge": split_the_merge,
	"send_zip": send_zip,
	"compression_factor": compression_factor,
	"thinking": thinking,
	"gemini_thinking_level": gemini_thinking_level,
	"gemini_thinking_budget": gemini_thinking_budget,
	"gpt_effort": gpt_effort,
	"target_language": target_language,
	"profile": profile,
	}
	})
	except Exception as e:
	sys.stderr.write(f"[CONFIG] Failed to persist /translate prefs: {e}\n")
	sys.stderr.flush()

	# Create temp directory
	temp_dir = tempfile.mkdtemp(
	prefix=f"discord_translate_{interaction.user.id}_",
	dir=BOT_TMPDIR or None,
	)
	input_path = os.path.join(temp_dir, filename)

	try:
	# Download file from attachment or URL
	if file:
	await file.save(input_path)
	elif url:
	import aiohttp

	# Convert Google Drive/Dropbox share links to direct download links
	download_url = url
	if 'drive.google.com' in url:
	# Extract file ID from various Google Drive URL formats
	if '/file/d/' in url:
	file_id = url.split('/file/d/')[1].split('/')[0]
	elif 'id=' in url:
	file_id = url.split('id=')[1].split('&')[0]
	else:
	await interaction.edit_original_response(embed=discord.Embed(
	title="❌ Invalid URL",
	description="Could not parse Google Drive file ID from URL",
	color=discord.Color.red()
	))
	return
	download_url = f"https://drive.google.com/uc?export=download&id={file_id}"
	elif 'dropbox.com' in url:
	# Convert Dropbox share link to direct download
	download_url = url.replace('www.dropbox.com', 'dl.dropboxusercontent.com').replace('?dl=0', '').replace('?dl=1', '')
	if '?dl=' not in download_url:
	download_url += '?dl=1'

	# Download the file
	async with aiohttp.ClientSession() as session:
	async with session.get(download_url) as response:
	if response.status == 200:
	with open(input_path, 'wb') as f:
	f.write(await response.read())

	# Try to get actual filename from response headers
	if 'content-disposition' in response.headers:
	import re
	content_disp = response.headers['content-disposition']
	fname_match = re.findall('filename="(.+)"', content_disp)
	if fname_match:
	actual_filename = fname_match[0]
	# Update filename if we got a better one
	new_input_path = os.path.join(temp_dir, actual_filename)
	os.rename(input_path, new_input_path)
	input_path = new_input_path
	filename = actual_filename
	else:
	await interaction.edit_original_response(embed=discord.Embed(
	title="❌ Download Failed",
	description=f"Failed to download file from URL (HTTP {response.status})",
	color=discord.Color.red()
	))
	return

	# Ensure the input file actually exists before starting the executor thread.
	# If this fails, /translate can end up in a bad state (e.g. cwd inside a deleted temp dir).
	try:
	if not os.path.isfile(input_path):
	raise FileNotFoundError(f"Downloaded/attached file not found on disk: {input_path}")
	if os.path.getsize(input_path) <= 0:
	raise FileNotFoundError(f"Downloaded/attached file is empty: {input_path}")
	except Exception as e:
	await interaction.edit_original_response(embed=discord.Embed(
	title="❌ Input File Error",
	description=str(e),
	color=discord.Color.red()
	))
	return

	# Get system prompt from config
	prompt_profiles = config.get('prompt_profiles', {})
	chosen_profile = (profile or "Universal").strip()
	system_prompt = None
	if prompt_profiles:
	# When a profile is chosen, use it as-is; do not substitute target_lang (per user note).
	system_prompt = prompt_profiles.get(chosen_profile)
	if system_prompt is None and 'Universal' in prompt_profiles:
	system_prompt = prompt_profiles['Universal']
	if not system_prompt:
	# Fallback to basic prompt
	system_prompt = f"Translate to {target_language}. Preserve all formatting."

	# Custom OpenAI Endpoint (single source of truth: custom_endpoint_url)
	# If omitted, keep disabled.
	if custom_endpoint_url:
	os.environ['USE_CUSTOM_OPENAI_ENDPOINT'] = '1'
	os.environ['OPENAI_CUSTOM_BASE_URL'] = custom_endpoint_url
	sys.stderr.write(f"[CONFIG] Custom OpenAI Endpoint enabled: {custom_endpoint_url}\n")
	else:
	os.environ['USE_CUSTOM_OPENAI_ENDPOINT'] = '0'
	os.environ['OPENAI_CUSTOM_BASE_URL'] = ''

	# Set model and API key
	os.environ['MODEL'] = model
	os.environ['SYSTEM_PROMPT'] = system_prompt
	os.environ['PROFILE_NAME'] = chosen_profile.lower() if chosen_profile else "universal"
	os.environ['OUTPUT_DIRECTORY'] = temp_dir
	os.environ['ENABLE_THOUGHTS'] = '0'

	# Set translation parameters
	os.environ['BATCH_TRANSLATION'] = '1'
	os.environ['BATCH_SIZE'] = str(batch_size)
	os.environ['MAX_OUTPUT_TOKENS'] = str(max_output_tokens)
	os.environ['TRANSLATION_TEMPERATURE'] = str(temperature)
	# Preserve markdown/structure and force BeautifulSoup for traditional APIs (from Other Settings)
	os.environ['ENHANCED_PRESERVE_STRUCTURE'] = '1' if config.get('enhanced_preserve_structure', True) else '0'
	os.environ['FORCE_BS_FOR_TRADITIONAL'] = '1' if config.get('force_bs_for_traditional', False) else '0'

	# Handle compression factor
	# TransateKRtoEN ultimately uses COMPRESSION_FACTOR; "AUTO_COMPRESSION_FACTOR" is treated
	# as a UI/bot toggle only.
	if compression_factor is not None:
	# Explicit override from the slash command.
	os.environ['COMPRESSION_FACTOR'] = str(compression_factor)
	os.environ['AUTO_COMPRESSION_FACTOR'] = '0'
	sys.stderr.write(f"[CONFIG] Manual compression factor: {compression_factor} (Auto-compression disabled)\n")
	else:
	# Respect config setting for auto-compression.
	# (config.json uses auto_compress_enabled; older variants may use auto_compression_factor)
	auto_comp = bool(config.get('auto_compress_enabled', config.get('auto_compression_factor', True)))
	os.environ['AUTO_COMPRESSION_FACTOR'] = '1' if auto_comp else '0'

	# Always set a deterministic COMPRESSION_FACTOR so downstream code doesn't fall back
	# to a different default unexpectedly.
	os.environ['COMPRESSION_FACTOR'] = str(config.get('compression_factor', 3.0))

	# Disable contextual translation by default (each batch is independent)
	os.environ['CONTEXTUAL'] = '0'
	# Disable emergency paragraph restoration
	os.environ['EMERGENCY_PARAGRAPH_RESTORE'] = '0'
	# Enable AI artifact removal
	os.environ['REMOVE_AI_ARTIFACTS'] = '1'
	# Retain original source filenames (no 'response_' prefix)
	os.environ['RETAIN_SOURCE_EXTENSION'] = '1'

	# Disable input token limit by default (no chapter size restrictions)
	os.environ['TOKEN_LIMIT_DISABLED'] = '1'
	os.environ['DISABLE_INPUT_TOKEN_LIMIT'] = '1'
	os.environ['MAX_INPUT_TOKENS'] = '' # Empty string = unlimited (matches GUI behavior)

	# Disable image translation for Discord bot (images don't work well via Discord)
	os.environ['ENABLE_IMAGE_TRANSLATION'] = '0'

	# Set extraction mode
	os.environ['TEXT_EXTRACTION_METHOD'] = extraction_mode
	if extraction_mode == 'enhanced':
	os.environ['EXTRACTION_MODE'] = 'enhanced'
	os.environ['ENHANCED_FILTERING'] = 'smart'
	os.environ['ENHANCED_PRESERVE_STRUCTURE'] = '1'
	else:
	os.environ['EXTRACTION_MODE'] = 'smart'
	os.environ['FILE_FILTERING_LEVEL'] = 'smart'

	# Set PDF-specific styling extraction variables from pdf_extractor
	# These ensure PDF font sizes, alignments, and styles are preserved
	if filename.endswith('.pdf'):
	sys.stderr.write(f"[CONFIG] Enabling PDF formatting extraction (font size, alignment, etc.)\n")
	sys.stderr.flush()
	# Force XHTML render mode for better PDF extraction quality
	os.environ['PDF_RENDER_MODE'] = 'xhtml'
	sys.stderr.write(f"[CONFIG] Using XHTML render mode for PDF\n")
	sys.stderr.flush()
	# The pdf_extractor.generate_css_from_pdf() function will automatically
	# detect and apply: base_font_size, font_family, text_align, line_height_ratio
	# from the actual PDF file during processing

	# Enable automatic glossary generation (user configurable)
	os.environ['ENABLE_AUTO_GLOSSARY'] = '1' if enable_auto_glossary else '0'
	# Set glossary parameters (use config if available, otherwise use defaults)
	os.environ['GLOSSARY_MIN_FREQUENCY'] = str(config.get('glossary_min_frequency', 2))
	os.environ['GLOSSARY_MAX_NAMES'] = str(config.get('glossary_max_names', 50))
	os.environ['GLOSSARY_MAX_TITLES'] = str(config.get('glossary_max_titles', 30))
	os.environ['APPEND_GLOSSARY'] = '1'

	# IMPORTANT: Treat empty-string config values as missing.
	# TransateKRtoEN.build_system_prompt() hard-fails if APPEND_GLOSSARY_PROMPT is blank.
	append_prompt = (config.get('append_glossary_prompt') or '').strip()
	if not append_prompt:
	append_prompt = '- Follow this reference glossary for consistent translation (Do not output any raw entries):'
	if not append_prompt.endswith('\n'):
	append_prompt += '\n'
	os.environ['APPEND_GLOSSARY_PROMPT'] = append_prompt

	# CRITICAL: Auto glossary uses AUTO_GLOSSARY_PROMPT (unified prompt used by the GUI).
	# If this is missing, GlossaryManager falls back to the legacy honorific/title regex scanner.
	os.environ['AUTO_GLOSSARY_PROMPT'] = config.get('unified_auto_glosary_prompt3', '') or ''
	# Ensure glossary translations target the same language as the main translation
	os.environ['GLOSSARY_TARGET_LANGUAGE'] = target_language
	os.environ['OUTPUT_LANGUAGE'] = target_language
	# Align throttling/timeouts with config defaults (matches GUI behavior)
	os.environ['SEND_INTERVAL_SECONDS'] = str(config.get('delay', 2.0))
	os.environ['THREAD_SUBMISSION_DELAY_SECONDS'] = str(config.get('thread_submission_delay', 0.5))
	os.environ['RETRY_TRUNCATED'] = '1' # Enable auto-retry truncated responses by default
	os.environ['MAX_RETRY_TOKENS'] = str(max_output_tokens) # Align retry token limit to output token limit
	os.environ['RETRY_TIMEOUT'] = '1' if config.get('retry_timeout', False) else '0'
	os.environ['CHUNK_TIMEOUT'] = str(config.get('chunk_timeout', 1800))
	os.environ['ENABLE_HTTP_TUNING'] = '1' if config.get('enable_http_tuning', False) else '0'
	os.environ['CONNECT_TIMEOUT'] = str(config.get('connect_timeout', 10))
	# Don't set READ_TIMEOUT for the bot; chunk timeout is the single source of truth.
	os.environ.pop('READ_TIMEOUT', None)
	os.environ['HTTP_POOL_CONNECTIONS'] = str(config.get('http_pool_connections', 20))
	os.environ['HTTP_POOL_MAXSIZE'] = str(config.get('http_pool_maxsize', 50))
	os.environ['IGNORE_RETRY_AFTER'] = '1' if config.get('ignore_retry_after', False) else '0'
	# Cap retries for the Discord bot to keep runs predictable.
	os.environ['MAX_RETRIES'] = '3'
	# Set all glossary variables from GUI
	os.environ['GLOSSARY_COMPRESSION_FACTOR'] = str(config.get('glossary_compression_factor', 1.2))
	# Enable glossary prompt compression (filtering unused entries) by default
	os.environ['COMPRESS_GLOSSARY_PROMPT'] = '1' if config.get('compress_glossary_prompt', True) else '0'
	os.environ['GLOSSARY_FILTER_MODE'] = config.get('glossary_filter_mode', 'all')
	os.environ['GLOSSARY_STRIP_HONORIFICS'] = '1' if config.get('glossary_strip_honorifics', True) else '0'
	os.environ['GLOSSARY_FUZZY_THRESHOLD'] = str(config.get('glossary_fuzzy_threshold', 0.90))
	os.environ['GLOSSARY_MAX_TEXT_SIZE'] = str(config.get('glossary_max_text_size', 50000))
	# Cap glossary max sentences for the Discord bot to keep prompts small/predictable.
	# (GlossaryManager reads this via GLOSSARY_MAX_SENTENCES)
	os.environ['GLOSSARY_MAX_SENTENCES'] = '200'
	os.environ['GLOSSARY_CHAPTER_SPLIT_THRESHOLD'] = str(config.get('glossary_chapter_split_threshold', 50000))
	os.environ['GLOSSARY_SKIP_FREQUENCY_CHECK'] = '0' # Enable frequency checking
	os.environ['CONTEXT_WINDOW_SIZE'] = str(config.get('glossary_context_window', 2))
	os.environ['GLOSSARY_USE_LEGACY_CSV'] = '0' # Use modern JSON format
	os.environ['GLOSSARY_DUPLICATE_KEY_MODE'] = config.get('glossary_duplicate_key_mode', 'auto')
	os.environ['GLOSSARY_DUPLICATE_CUSTOM_FIELD'] = config.get('glossary_duplicate_custom_field', '')
	os.environ['GLOSSARY_DUPLICATE_ALGORITHM'] = duplicate_algorithm
	# Gender context and description for automatic glossary (enabled by default)
	os.environ['GLOSSARY_INCLUDE_GENDER_CONTEXT'] = '1' if config.get('include_gender_context', True) else '0'
	os.environ['GLOSSARY_INCLUDE_DESCRIPTION'] = '1' if config.get('include_description', True) else '0'
	# Custom glossary fields (additional columns) - default to ['description']
	custom_fields = config.get('custom_glossary_fields', [])
	if not custom_fields and not config.get('custom_field_description_removed', False):
	custom_fields = ['description']
	os.environ['GLOSSARY_CUSTOM_FIELDS'] = json.dumps(custom_fields)
	# Glossary-specific overrides for API settings
	os.environ['GLOSSARY_MAX_OUTPUT_TOKENS'] = str(config.get('glossary_max_output_tokens', max_output_tokens))
	os.environ['GLOSSARY_TEMPERATURE'] = str(config.get('manual_glossary_temperature', 0.1))
	os.environ['GLOSSARY_REQUEST_MERGING_ENABLED'] = '0' # Disable by default
	os.environ['GLOSSARY_REQUEST_MERGE_COUNT'] = str(config.get('glossary_request_merge_count', 10))

	# Set duplicate detection mode to balanced
	os.environ['DUPLICATE_DETECTION_MODE'] = 'balanced'

	# Disable batch translate headers (metadata translation)
	os.environ['BATCH_TRANSLATE_HEADERS'] = '0'

	# Set manual glossary path if provided (download attachment first)
	if manual_glossary:
	# Validate glossary file extension
	if manual_glossary.filename.endswith('.csv') or manual_glossary.filename.endswith('.json'):
	glossary_path = os.path.join(temp_dir, manual_glossary.filename)
	await manual_glossary.save(glossary_path)
	os.environ['MANUAL_GLOSSARY'] = glossary_path
	sys.stderr.write(f"[CONFIG] Using manual glossary: {manual_glossary.filename}\n")
	sys.stderr.flush()
	else:
	sys.stderr.write(f"[WARNING] Manual glossary must be .csv or .json: {manual_glossary.filename}\n")
	sys.stderr.flush()

	# Request merging settings (combine multiple chapters into single API request)
	# Single source of truth: request_merge_count
	if request_merge_count is None:
	# If omitted, keep merging disabled
	request_merging_enabled = False
	request_merge_count_raw = 1
	else:
	request_merge_count_raw = int(request_merge_count)
	request_merging_enabled = request_merge_count_raw >= 2

	# Keep the count safe for downstream code (even when disabled)
	request_merge_count_effective = max(1, request_merge_count_raw)

	os.environ['REQUEST_MERGING_ENABLED'] = '1' if request_merging_enabled else '0'
	os.environ['REQUEST_MERGE_COUNT'] = str(request_merge_count_effective)
	os.environ['SPLIT_THE_MERGE'] = '1' if split_the_merge else '0'
	os.environ['DISABLE_MERGE_FALLBACK'] = '1' # Mark as qa_failed if split fails
	os.environ['SYNTHETIC_MERGE_HEADERS'] = '1' # Use synthetic headers for better splitting

	# Force the Gemini safety filter off for every Discord bot translation
	os.environ['DISABLE_GEMINI_SAFETY'] = 'true'

	# Handle Thinking Toggle
	# If thinking is True (default), we don't need to do anything as we respect the config/env
	# If thinking is False, we explicitly disable all thinking features
	if not thinking:
	os.environ['ENABLE_GPT_THINKING'] = '0'
	os.environ['ENABLE_GEMINI_THINKING'] = '0'
	os.environ['ENABLE_DEEPSEEK_THINKING'] = '0'
	sys.stderr.write(f"[CONFIG] Thinking capabilities disabled via command\n")

	# Handle Vertex AI / Google Cloud credentials
	if '@' in model or model.startswith('vertex/'):
	# Prefer an uploaded credentials file; otherwise fall back to config.json.
	google_creds = None
	if google_credentials_file is not None:
	# Save uploaded creds into the job temp dir.
	# Discord provides the filename; ensure it's safe.
	creds_name = os.path.basename(getattr(google_credentials_file, 'filename', '') or 'google_credentials.json')
	if not creds_name.lower().endswith('.json'):
	creds_name = 'google_credentials.json'
	google_creds = os.path.join(temp_dir, creds_name)
	try:
	await google_credentials_file.save(google_creds)
	except Exception as e:
	sys.stderr.write(f"[CONFIG] Failed to save uploaded Google credentials: {e}\n")
	google_creds = None

	if google_creds is None:
	google_creds = config.get('google_cloud_credentials')

	if google_creds and os.path.exists(google_creds):
	os.environ['GOOGLE_APPLICATION_CREDENTIALS'] = google_creds
	sys.stderr.write(f"[CONFIG] Using Google Cloud credentials: {os.path.basename(google_creds)}\n")
	sys.stderr.flush()

	# Extract project ID from credentials
	try:
	with open(google_creds, 'r', encoding='utf-8') as f:
	creds_data = json.load(f)
	project_id = creds_data.get('project_id', 'vertex-ai-project')
	os.environ['GOOGLE_CLOUD_PROJECT'] = project_id
	if not api_key:
	api_key = project_id
	except Exception:
	pass

	# Set API key - TransateKRtoEN checks multiple env vars
	os.environ['API_KEY'] = api_key
	os.environ['OPENAI_API_KEY'] = api_key
	os.environ['OPENAI_OR_Gemini_API_KEY'] = api_key

	# Set provider-specific keys
	if 'claude' in model.lower():
	os.environ['ANTHROPIC_API_KEY'] = api_key
	elif 'gemini' in model.lower():
	os.environ['GOOGLE_API_KEY'] = api_key
	os.environ['GEMINI_API_KEY'] = api_key

	# Initialize translation state in global storage
	user_id = interaction.user.id
	translation_states[user_id] = {
	'logs': [],
	'show_full': False,
	'stop_requested': False,
	'last_update': 0,
	'pending_update': False
	}
	state = translation_states[user_id]

	def log_callback(msg):
	"""Record one translator log line and trigger a throttled progress refresh.

	Handed to TransateKRtoEN.main() as ``log_callback`` by run_translation,
	which is started through loop.run_in_executor(); the embed refresh is
	therefore submitted to bot.loop instead of being awaited here.
	"""
	# Only non-blank messages are recorded.
	if msg and msg.strip():
	state['logs'].append(msg.strip())
	# Use stderr to avoid recursion (stdout is redirected to callback)
	sys.stderr.write(f"[LOG] {msg.strip()}\n")
	sys.stderr.flush()

	# Rate limit: update at most once per second to avoid Discord rate limits
	import time
	current_time = time.time()
	if current_time - state['last_update'] >= 1.0:
	state['last_update'] = current_time
	state['pending_update'] = False
	# Schedule the refresh coroutine on the bot's event loop from this thread.
	asyncio.run_coroutine_threadsafe(update_progress(), bot.loop)
	else:
	# Mark that we have a pending update
	# (periodic_update_check() picks this flag up and performs the refresh).
	state['pending_update'] = True

	def stop_callback():
	    """Report whether a stop has been requested for this translation run."""
	    stop_flag = state['stop_requested']
	    return stop_flag

	async def periodic_update_check():
	    """Poll once per second and push any progress refresh that was deferred.

	    Runs until this user's entry leaves translation_states or a stop has been
	    requested.
	    """
	    import time
	    while True:
	        if user_id not in translation_states or state['stop_requested']:
	            break
	        await asyncio.sleep(1)
	        if not state.get('pending_update', False):
	            # Nothing was deferred during the last second.
	            continue
	        # Clear the flag and stamp the refresh time before redrawing.
	        state['pending_update'] = False
	        state['last_update'] = time.time()
	        await update_progress()

	async def update_progress():
	    """Rebuild the in-progress embed from the collected logs and edit the message.

	    Depending on state['show_full'], the embed shows either the whole log
	    (tail-trimmed to 3900 characters) or the last 10 entries (tail-trimmed to
	    800 characters). Any failure is written to stderr and swallowed.
	    """
	    try:
	        entries = state['logs']
	        expanded = state['show_full']
	        if expanded:
	            # Full view: keep only the tail so the description fits in the embed.
	            body = '\n'.join(entries)
	            if len(body) > 3900:
	                body = "..." + body[-3900:]
	        else:
	            # Compact view: the 10 most recent entries, capped at 800 characters.
	            body = '\n'.join(entries[-10:])
	            body = body[-800:] if len(body) > 800 else body

	        body = body or "Starting..."

	        progress_embed = discord.Embed(
	            title="📚 Translation in Progress",
	            description=f"Status: Processing... ({len(entries)} logs)\n\n```{body}```",
	            color=discord.Color.blue()
	        )

	        # A fresh LogView supplies the log-toggle / stop buttons on every refresh.
	        await message.edit(embed=progress_embed, view=LogView(user_id))
	    except Exception as e:
	        sys.stderr.write(f"[ERROR] Failed to update progress: {e}\n")
	        sys.stderr.flush()

	# Run translation
	await update_progress()

	# Start periodic update checker
	update_task = asyncio.create_task(periodic_update_check())

	def run_translation():
	    """Run the blocking TransateKRtoEN translation for the prepared input file.

	    Started through loop.run_in_executor(), i.e. off the event-loop thread.
	    sys.argv is swapped for the duration of the call and always restored.

	    Returns:
	        Whatever TransateKRtoEN.main() returns.
	    """
	    # Ensure we aren't running inside a deleted directory.
	    _ensure_stable_cwd()

	    # These records must end in a real newline; a doubled backslash would
	    # print a literal backslash-n and glue consecutive stderr lines together.
	    sys.stderr.write(f"[TRANSLATE] Starting translation for: {input_path}\n")
	    sys.stderr.write(f"[TRANSLATE] Temp directory: {temp_dir}\n")
	    sys.stderr.flush()

	    # IMPORTANT: Do NOT chdir() in a multi-command Discord bot.
	    # chdir() is process-wide and can break other concurrent interactions.
	    # TransateKRtoEN is patched to respect OUTPUT_DIRECTORY for absolute output paths.
	    # NOTE(review): sys.argv is process-wide as well; confirm that overlapping
	    # translations cannot observe each other's value.
	    original_argv = sys.argv[:]
	    try:
	        # The input path is supplied via argv (presumably read by TransateKRtoEN.main()).
	        sys.argv = ['discord_bot.py', input_path]
	        result = TransateKRtoEN.main(log_callback=log_callback, stop_callback=stop_callback)

	        sys.stderr.write("[TRANSLATE] Translation completed\n")
	        sys.stderr.flush()
	        return result
	    finally:
	        # Prevent leaking argv changes across commands.
	        sys.argv = original_argv

	loop = asyncio.get_event_loop()
	await loop.run_in_executor(None, run_translation)

	# Cancel the periodic update task
	update_task.cancel()
	try:
	await update_task
	except asyncio.CancelledError:
	pass

	# Determine output format and file
	output_file_path = None
	output_display_name = None
	is_zip_output = False

	# Prefer deterministic output selection from the translation output folder.
	# TransateKRtoEN writes into: OUTPUT_DIRECTORY/<file_base>/...
	output_base = os.path.splitext(os.path.basename(filename))[0]
	safe_base = output_base.replace('/', '_').replace('\\', '_').replace(':', '_').replace('*', '_').replace('?', '_').replace('"', '_').replace('<', '_').replace('>', '_').replace('\|', '_')
	preferred_output_dir = os.path.join(temp_dir, filename)

	# The translator historically used the raw base name; keep both candidates for compatibility.
	candidate_dirs = [
	preferred_output_dir,
	os.path.join(temp_dir, output_base),
	os.path.join(temp_dir, safe_base),
	]
	existing_dir = None
	seen = set()
	for d in candidate_dirs:
	if d in seen:
	continue
	seen.add(d)
	try:
	if os.path.exists(d) and os.path.isdir(d):
	existing_dir = d
	break
	except Exception:
	continue

	output_subdir = preferred_output_dir
	if existing_dir:
	if existing_dir != preferred_output_dir and not os.path.exists(preferred_output_dir):
	try:
	os.replace(existing_dir, preferred_output_dir)
	output_subdir = preferred_output_dir
	except Exception:
	output_subdir = existing_dir
	else:
	output_subdir = preferred_output_dir if existing_dir == preferred_output_dir else existing_dir
	else:
	try:
	os.makedirs(preferred_output_dir, exist_ok=True)
	except OSError:
	output_subdir = os.path.join(temp_dir, safe_base)
	os.makedirs(output_subdir, exist_ok=True)

	def _pick_newest(d: str, exts: list[str], must_contain: Optional[str] = None) -> Optional[str]:
	    """Return the most recently modified matching file directly inside ``d``.

	    Args:
	        d: Directory to scan (not recursive).
	        exts: Lower-case suffixes a file name must end with; an empty list
	            accepts any suffix.
	        must_contain: Optional substring the lower-cased file name must contain.

	    Returns:
	        Path of the newest match, or None when the directory is missing,
	        nothing matches, or any error occurs. The input file and ``.zip``
	        files are never returned.
	    """
	    try:
	        if not (os.path.exists(d) and os.path.isdir(d)):
	            return None

	        needle = must_contain.lower() if must_contain else None
	        matches = []
	        for entry in os.listdir(d):
	            full_path = os.path.join(d, entry)
	            lowered = entry.lower()
	            if full_path == input_path or lowered.endswith('.zip'):
	                continue
	            if exts and not any(lowered.endswith(suffix) for suffix in exts):
	                continue
	            if needle and needle not in lowered:
	                continue
	            if not os.path.isfile(full_path):
	                continue
	            try:
	                stamp = os.path.getmtime(full_path)
	            except Exception:
	                # Unreadable mtime: keep the file but rank it as oldest.
	                stamp = 0
	            matches.append((stamp, full_path))

	        if not matches:
	            return None
	        # On equal timestamps the first file listed wins.
	        return max(matches, key=lambda pair: pair[0])[1]
	    except Exception:
	        return None

	input_ext = os.path.splitext(filename)[1].lower()

	# If user didn't request zip, try to pick the most likely final artifact.
	if not send_zip:
	sys.stderr.write(f"[OUTPUT] Selecting output from: {output_subdir}\\n")
	sys.stderr.flush()

	# Prefer translated-named artifacts for text/PDF flows.
	if input_ext == '.epub':
	output_file_path = _pick_newest(output_subdir, exts=['.epub'])
	elif input_ext == '.pdf':
	output_file_path = (
	_pick_newest(output_subdir, exts=['.pdf'], must_contain='_translated')
	or _pick_newest(output_subdir, exts=['.html'], must_contain='_translated')
	or _pick_newest(output_subdir, exts=['.txt'], must_contain='_translated')
	or _pick_newest(output_subdir, exts=['.pdf', '.html', '.txt'])
	)
	else:
	# .txt and other text-like inputs
	output_file_path = (
	_pick_newest(output_subdir, exts=['.txt'], must_contain='_translated')
	or _pick_newest(output_subdir, exts=['.pdf'], must_contain='_translated')
	or _pick_newest(output_subdir, exts=['.html'], must_contain='_translated')
	or _pick_newest(output_subdir, exts=[input_ext])
	or _pick_newest(output_subdir, exts=['.pdf', '.html', '.txt'])
	)

	if output_file_path:
	output_display_name = os.path.basename(output_file_path)
	sys.stderr.write(f"[OUTPUT] Selected output file: {output_file_path}\\n")
	sys.stderr.flush()

	# If we selected a file but it doesn't exist, treat it as a miss and fall back to ZIP.
	try:
	if output_file_path and not os.path.exists(output_file_path):
	sys.stderr.write(f"[OUTPUT] Selected file missing on disk, falling back to ZIP: {output_file_path}\\n")
	sys.stderr.flush()
	output_file_path = None
	output_display_name = None
	except Exception:
	output_file_path = None
	output_display_name = None

	# If zip requested OR file not found, proceed with zipping
	if send_zip or not output_file_path:
	is_zip_output = True

	sys.stderr.write(f"[ZIP] Creating zip archive of output...\\n")
	sys.stderr.write(f"[ZIP] Temp dir: {temp_dir}\\n")
	sys.stderr.write(f"[ZIP] Output dir: {output_subdir}\\n")

	# Zip the translation output folder if it exists; otherwise zip the whole temp dir.
	if os.path.exists(output_subdir) and os.path.isdir(output_subdir):
	zip_source_dir = output_subdir
	sys.stderr.write(f"[ZIP] Using output directory as source\\n")
	else:
	zip_source_dir = temp_dir
	sys.stderr.write(f"[ZIP] Using temp dir as source (no output dir found)\\n")
	sys.stderr.flush()

	preferred_zip_name = f"{filename}.zip"
	zip_filename = preferred_zip_name
	zip_path = os.path.join(temp_dir, zip_filename)

	# Update status to show zipping
	embed = discord.Embed(
	title="📦 Creating Archive",
	description="Compressing output files...",
	color=discord.Color.blue()
	)
	try:
	await message.edit(embed=embed, view=None)
	except discord.errors.HTTPException:
	pass

	try:
	# Create zip archive in background thread
	def create_zip(target_path: str):
	    """Write the files under zip_source_dir into a deflated ZIP at target_path.

	    Files whose name ends in ``.zip`` and the original input file are left
	    out; archive entries are stored relative to zip_source_dir.

	    Args:
	        target_path: Destination path of the archive to create.

	    Returns:
	        target_path, unchanged.
	    """
	    # Real newline here; a doubled backslash would print a literal backslash-n.
	    sys.stderr.write(f"[ZIP] Starting compression to {os.path.basename(target_path)}...\n")
	    import zipfile
	    with zipfile.ZipFile(target_path, 'w', zipfile.ZIP_DEFLATED) as zipf:
	        for root, _dirs, files in os.walk(zip_source_dir):
	            for file_item in files:
	                file_path = os.path.join(root, file_item)
	                # Skip archives (this also covers the one being written when it
	                # lives under the source dir) and the input file.
	                if file_item.endswith('.zip') or file_path == input_path:
	                    continue
	                zipf.write(file_path, os.path.relpath(file_path, zip_source_dir))
	    return target_path

	loop = asyncio.get_event_loop()
	try:
	await loop.run_in_executor(None, functools.partial(create_zip, zip_path))
	except (OSError, ValueError) as zip_err:
	fallback_zip_name = f"{safe_base}.zip"
	if zip_filename != fallback_zip_name:
	sys.stderr.write(f"[ZIP] Preferred zip name '{zip_filename}' failed ({zip_err}); falling back to safe name.\\n")
	zip_filename = fallback_zip_name
	zip_path = os.path.join(temp_dir, zip_filename)
	await loop.run_in_executor(None, functools.partial(create_zip, zip_path))
	else:
	raise

	output_file_path = zip_path
	output_display_name = zip_filename

	except Exception as e:
	sys.stderr.write(f"[ERROR] Failed to create zip: {e}\\n")
	raise e

	async def _dm_or_channel(content: str = None, embed: Optional[discord.Embed] = None, file: Optional[discord.File] = None):
	# Always prefer DM; fall back to channel if DMs blocked.
	try:
	await interaction.user.send(content=content, embed=embed, file=file)
	return True
	except discord.Forbidden:
	try:
	await interaction.channel.send(content=content, embed=embed, file=file)
	return True
	except Exception:
	return False
	except Exception:
	return False

	# Send the result (either zip or direct file)
	if os.path.exists(output_file_path):
	file_size = os.path.getsize(output_file_path)
	sys.stderr.write(f"[SUCCESS] Ready to send: {output_file_path} ({file_size / 1024 / 1024:.2f}MB)\\n")

	if _should_offload(file_size, send_zip):
	loop = asyncio.get_event_loop()
	download_url = None
	# 1) tmpfiles
	for uploader, name in (( _upload_to_tempsh, "temp.sh"), (_upload_to_tmpfiles, "tmpfiles"), (_upload_to_oracle_par, "oracle"), (_upload_to_gofile, "gofile")):
	try:
	download_url = await loop.run_in_executor(
	None,
	functools.partial(uploader, output_file_path, output_display_name),
	)
	break
	except Exception as e2:
	sys.stderr.write(f"[HOST ERROR] {name}: {e2}\n")
	continue
	if download_url:
	embed = discord.Embed(
	title="✅ Translation Complete!",
	description=(
	f"File: {output_display_name}\\n"
	f"Size: {file_size / 1024 / 1024:.2f}MB\\n"
	f"Download: <{download_url}>"
	),
	color=discord.Color.green()
	)
	await _dm_or_channel(embed=embed)
	else:
	await _dm_or_channel(
	content="Could not upload the output file right now. Please try again later."
	)
	else:
	if state['stop_requested']:
	title = "⏹️ Translation Stopped - Partial Results"
	desc_text = "Contains partial translation output."
	color = discord.Color.orange()
	else:
	title = "✅ Translation Complete!"
	desc_text = "Translation finished successfully."
	color = discord.Color.green()

	embed = discord.Embed(
	title=title,
	description=f"File: {output_display_name}\\nSize: {file_size / 1024 / 1024:.2f}MB\\n\\n{desc_text}",
	color=color
	)
	sent = await _dm_or_channel(embed=embed)

	try:
	msg_content = f"Here's your {('zipped ' if is_zip_output else '')}translation output!"
	await _dm_or_channel(
	content=msg_content,
	file=discord.File(output_file_path, filename=output_display_name),
	)
	except Exception:
	# Fallback: try uploading to Gofile if direct send fails
	try:
	loop = asyncio.get_event_loop()
	download_url = await loop.run_in_executor(
	None,
	functools.partial(_upload_to_gofile, output_file_path, output_display_name),
	)
	await _dm_or_channel(
	content=f"Download: {download_url}",
	)
	except Exception:
	await _dm_or_channel(
	content="Upload failed and Gofile is unavailable right now."
	)
	else:
	raise FileNotFoundError(f"Output file not found: {output_file_path}")

	except Exception as e:
	import traceback
	error = f"```\n{traceback.format_exc()[-1000:]}\n```"
	embed = discord.Embed(
	title="❌ Error",
	description=f"{str(e)}\n{error}",
	color=discord.Color.red()
	)
	try:
	await message.edit(embed=embed, view=None)
	except discord.errors.HTTPException:
	await interaction.followup.send(embed=embed)

	finally:
	# Cleanup translation state
	if user_id in translation_states:
	del translation_states[user_id]

	# Ensure we are not sitting inside the temp dir (or a deleted cwd) before deleting it.
	try:
	cwd = os.getcwd()
	except FileNotFoundError:
	try:
	os.chdir(src_dir)
	except Exception:
	pass
	else:
	try:
	if os.path.commonpath([os.path.abspath(cwd), os.path.abspath(temp_dir)]) == os.path.abspath(temp_dir):
	os.chdir(src_dir)
	except Exception:
	pass

	# Cleanup temp directory
	try:
	shutil.rmtree(temp_dir)
	except Exception:
	pass

	@bot.tree.command(name="settings", description="Show your saved Glossarion bot preferences")
	async def settings(interaction: discord.Interaction):
	    """Display the caller's saved /translate and /extract defaults.

	    The interaction is deferred ephemerally, the caller's stored config is
	    loaded, and its "translate" and "extract" sections are rendered as
	    pretty-printed JSON in two embed fields. If neither section holds any
	    data, a short hint is shown instead of the embed.
	    """

	    if not await _safe_defer(interaction, ephemeral=True):
	        return

	    user_id = interaction.user.id
	    cfg = load_user_config(user_id) or {}
	    translate_cfg = cfg.get("translate") or {}
	    extract_cfg = cfg.get("extract") or {}

	    if not translate_cfg and not extract_cfg:
	        await _safe_edit_original_response(
	            interaction,
	            content="ℹ️ No saved settings yet. Run /translate or /extract once to store them."
	        )
	        return

	    # Discord rejects an embed whose field value is longer than 1024
	    # characters, so the code fence and the truncation marker must be
	    # counted against that budget, not just the raw JSON text.
	    field_value_limit = 1024
	    fence_open = "```json\n"
	    fence_close = "\n```"
	    truncation_marker = "... (truncated)"
	    json_budget = field_value_limit - len(fence_open) - len(fence_close)

	    def _fmt(section: dict) -> str:
	        """Render one config section as a fenced JSON block that fits an embed field."""
	        if not section:
	            return "_none_"
	        text = json.dumps(section, indent=2, ensure_ascii=False)
	        if len(text) > json_budget:
	            # Leave room for the marker so the final value never exceeds the limit.
	            text = text[:json_budget - len(truncation_marker)] + truncation_marker
	        return f"{fence_open}{text}{fence_close}"

	    embed = discord.Embed(
	        title="Your Saved Settings",
	        color=discord.Color.blue()
	    )
	    embed.add_field(name="Translate", value=_fmt(translate_cfg), inline=False)
	    embed.add_field(name="Extract", value=_fmt(extract_cfg), inline=False)

	    await _safe_edit_original_response(interaction, embed=embed)

	@bot.tree.command(name="extract", description="Extract glossary from EPUB, TXT, or PDF file")
	@app_commands.describe(
	file="EPUB, TXT, or PDF file to extract glossary from (optional if using url)",
	url="Google Drive or Dropbox link to file (optional if using file attachment)",
	api_key="Your API key (optional after /save)",
	passphrase="Passphrase to decrypt saved credentials (if set in /save)",
	model="AI model to use (optional; defaults to config.json if omitted)",
	custom_endpoint_url="Custom OpenAI-compatible base URL (auto-enables when set; omit to disable)",
	google_credentials_file="Google Cloud credentials JSON file upload (for Vertex AI models)",
	extraction_mode="Text extraction method (default: Enhanced/html2text)",
	temperature="Glossary extraction temperature 0.0-1.0 (default: 0.1)",
	batch_size="Paragraphs per batch (default: 10)",
	max_output_tokens="Max output tokens (default: 65536)",
	glossary_compression_factor="Glossary compression factor (default: 1.2)",
	merge_count="Chapters per request (set >=2 to enable request merging; <=1 disables; omit to disable)",
	duplicate_algorithm="Duplicate handling: auto/strict/balanced/aggressive/basic (default: balanced)",
	send_zip="Return output as a ZIP archive instead of individual file (default: False)",
	thinking="Enable/disable AI thinking capabilities (GPT/Gemini/DeepSeek) - Default: True",
	gemini_thinking_level="Gemini 3 thinking level (low/high) - Default: high",
	gemini_thinking_budget="Gemini thinking budget (-1=auto, 0=disabled) - Default: -1",
	gpt_effort="GPT-5/OpenAI thinking effort (none/low/medium/high/xhigh) - Default: medium",
	target_language="Target language for translations"
	)
	@app_commands.choices(extraction_mode=[
	app_commands.Choice(name="Enhanced (html2text)", value="enhanced"),
	app_commands.Choice(name="Standard (BeautifulSoup)", value="standard"),
	])
	@app_commands.choices(gemini_thinking_level=[
	app_commands.Choice(name="High", value="high"),
	app_commands.Choice(name="Low", value="low"),
	])
	@app_commands.choices(gpt_effort=[
	app_commands.Choice(name="None", value="none"),
	app_commands.Choice(name="Low", value="low"),
	app_commands.Choice(name="Medium", value="medium"),
	app_commands.Choice(name="High", value="high"),
	app_commands.Choice(name="XHigh", value="xhigh"),
	])
	@app_commands.autocomplete(model=model_autocomplete)
	async def extract(
	interaction: discord.Interaction,
	file: discord.Attachment = None,
	url: str = None,
	api_key: Optional[str] = None,
	passphrase: Optional[str] = None,
	model: Optional[str] = None,
	custom_endpoint_url: Optional[str] = None,
	google_credentials_file: discord.Attachment = None,
	extraction_mode: str = "enhanced",
	temperature: float = 0.1,
	batch_size: int = 10,
	max_output_tokens: int = 65536,
	glossary_compression_factor: float = 1.2,
	merge_count: Optional[int] = None,
	duplicate_algorithm: str = "balanced",
	send_zip: bool = False,
	thinking: bool = True,
	gemini_thinking_level: str = "high",
	gemini_thinking_budget: int = -1,
	gpt_effort: str = "medium",
	target_language: str = "English"
	):
	"""Extract glossary from file using Glossarion"""

	# Acknowledge ASAP to avoid 10062 Unknown interaction under load.
	if not await _safe_defer(interaction, ephemeral=_ephemeral(interaction)):
	return

	_ensure_stable_cwd()

	if not GLOSSARION_AVAILABLE or not glossary_main:
	await _safe_edit_original_response(interaction, content="❌ Glossarion glossary extraction not available")
	return

	# Validate input - must have either file or URL
	if not file and not url:
	await _safe_edit_original_response(interaction, content="❌ Please provide either a file attachment or a URL")
	return

	# Get filename and validate extension
	if file:
	filename = file.filename
	elif url:
	# Extract filename from URL or use default
	if 'drive.google.com' in url:
	filename = 'google_drive_file.epub'
	elif 'dropbox.com' in url:
	filename = 'dropbox_file.epub'
	else:
	from urllib.parse import urlparse, unquote
	parsed = urlparse(url)
	filename = unquote(os.path.basename(parsed.path)) or 'downloaded_file.epub'

	# Never trust user/remote-provided names to be a safe path.
	# Keep /extract isolated from path traversal and accidental subdirectories.
	filename = os.path.basename(filename)

	# Validate file extension
	if not (filename.endswith('.epub') or filename.endswith('.txt') or filename.endswith('.pdf')):
	await _safe_edit_original_response(interaction, content="❌ File must be EPUB, TXT, or PDF format")
	return

	# Validate request merge count early (if explicitly provided)
	if merge_count is not None and merge_count < 0:
	await _safe_edit_original_response(interaction, content="❌ merge_count must be >= 0")
	return

	# Validate custom endpoint URL early (if provided)
	if custom_endpoint_url is not None:
	custom_endpoint_url = custom_endpoint_url.strip()
	if custom_endpoint_url and not (custom_endpoint_url.startswith('http://') or custom_endpoint_url.startswith('https://')):
	await _safe_edit_original_response(interaction, content="❌ custom_endpoint_url must start with http:// or https://")
	return
	user_id = interaction.user.id
	user_config = load_user_config(user_id)

	try:
	saved_creds = load_saved_credentials(user_id, passphrase)
	except ValueError as e:
	await _safe_edit_original_response(interaction, content=f"❌ {e}")
	return
	except Exception:
	saved_creds = None

	# Load config early so we can default the model without relying on autocomplete.
	config = load_config()

	# Default model: prefer explicit user input, otherwise config.json, then env var, then a safe fallback.
	if saved_creds and not model:
	model = (saved_creds.get('model') or '').strip()
	model = (model or '').strip() or (config.get('model') or '').strip() or (os.getenv('MODEL') or '').strip() or 'gpt-4o'

	if saved_creds and not api_key:
	api_key = saved_creds.get('api_key')
	api_key = (api_key or '').strip()
	if not api_key:
	await _safe_edit_original_response(interaction, content="❌ No API key available. Provide api_key or run /save first (with passphrase if set).")
	return

	use_multi_keys = bool(saved_creds and saved_creds.get("use_multi_api_keys") and saved_creds.get("multi_api_keys"))
	if use_multi_keys:
	os.environ['USE_MULTI_API_KEYS'] = '1'
	os.environ['USE_MULTI_KEYS'] = '1'
	try:
	from unified_api_client import UnifiedClient
	mk_list = saved_creds.get("multi_api_keys", [])
	UnifiedClient.set_in_memory_multi_keys(mk_list)
	except Exception:
	pass
	else:
	os.environ['USE_MULTI_API_KEYS'] = '0'
	os.environ['USE_MULTI_KEYS'] = '0'
	try:
	from unified_api_client import UnifiedClient
	UnifiedClient.clear_in_memory_multi_keys()
	except Exception:
	pass

	use_fallback_keys = bool(saved_creds and saved_creds.get("use_fallback_keys") and saved_creds.get("fallback_keys"))
	if use_fallback_keys:
	os.environ['USE_FALLBACK_KEYS'] = '1'
	os.environ['FALLBACK_KEYS'] = json.dumps(saved_creds.get("fallback_keys", []))
	else:
	os.environ['USE_FALLBACK_KEYS'] = '0'
	os.environ.pop('FALLBACK_KEYS', None)

	# Initial response (we already deferred; now edit the original response)
	embed = discord.Embed(
	title="📚 Glossary Extraction Started",
	description=f"File: {filename}\nModel: {model}\nTarget: {target_language}",
	color=discord.Color.blue()
	)
	msg_obj = await _safe_edit_original_response(interaction, embed=embed)
	if msg_obj is None:
	return
	try:
	message = await interaction.original_response()
	except Exception:
	message = None
	if message is None:
	return
	# Persist user preferences for next runs
	try:
	save_user_config(user_id, {
	"extract": {
	"model": model,
	"custom_endpoint_url": custom_endpoint_url,
	"extraction_mode": extraction_mode,
	"temperature": temperature,
	"batch_size": batch_size,
	"max_output_tokens": max_output_tokens,
	"glossary_compression_factor": glossary_compression_factor,
	"merge_count": merge_count,
	"duplicate_algorithm": duplicate_algorithm,
	"send_zip": send_zip,
	"thinking": thinking,
	"gemini_thinking_level": gemini_thinking_level,
	"gemini_thinking_budget": gemini_thinking_budget,
	"gpt_effort": gpt_effort,
	"target_language": target_language,
	}
	})
	except Exception as e:
	sys.stderr.write(f"[CONFIG] Failed to persist /extract prefs: {e}\n")
	sys.stderr.flush()

	# Create temp directory
	temp_dir = tempfile.mkdtemp(
	prefix=f"discord_extract_{interaction.user.id}_",
	dir=BOT_TMPDIR or None,
	)
	input_path = os.path.join(temp_dir, filename)

	try:
	# Download file from attachment or URL
	if file:
	await file.save(input_path)
	elif url:
	import aiohttp

	# Convert Google Drive/Dropbox share links to direct download links
	download_url = url
	if 'drive.google.com' in url:
	if '/file/d/' in url:
	file_id = url.split('/file/d/')[1].split('/')[0]
	elif 'id=' in url:
	file_id = url.split('id=')[1].split('&')[0]
	else:
	await interaction.edit_original_response(embed=discord.Embed(
	title="❌ Invalid URL",
	description="Could not parse Google Drive file ID from URL",
	color=discord.Color.red()
	))
	return
	download_url = f"https://drive.google.com/uc?export=download&id={file_id}"
	elif 'dropbox.com' in url:
	download_url = url.replace('www.dropbox.com', 'dl.dropboxusercontent.com').replace('?dl=0', '').replace('?dl=1', '')
	if '?dl=' not in download_url:
	download_url += '?dl=1'

	# Download the file
	async with aiohttp.ClientSession() as session:
	async with session.get(download_url) as response:
	if response.status == 200:
	with open(input_path, 'wb') as f:
	f.write(await response.read())

	# Try to get actual filename from response headers
	if 'content-disposition' in response.headers:
	import re
	content_disp = response.headers['content-disposition']
	fname_match = re.findall('filename="(.+)"', content_disp)
	if fname_match:
	actual_filename = os.path.basename(fname_match[0])
	new_input_path = os.path.join(temp_dir, actual_filename)
	os.rename(input_path, new_input_path)
	input_path = new_input_path
	filename = actual_filename
	else:
	await interaction.edit_original_response(embed=discord.Embed(
	title="❌ Download Failed",
	description=f"Failed to download file from URL (HTTP {response.status})",
	color=discord.Color.red()
	))
	return

	# Ensure the input file actually exists before starting the executor thread.
	try:
	if not os.path.isfile(input_path):
	raise FileNotFoundError(f"Downloaded/attached file not found on disk: {input_path}")
	if os.path.getsize(input_path) <= 0:
	raise FileNotFoundError(f"Downloaded/attached file is empty: {input_path}")
	except Exception as e:
	await interaction.edit_original_response(embed=discord.Embed(
	title="❌ Input File Error",
	description=str(e),
	color=discord.Color.red()
	))
	return

	# Get glossary prompts from config
	glossary_prompt = config.get('manual_glossary_prompt', '')

	# Custom OpenAI Endpoint (single source of truth: custom_endpoint_url)
	# If omitted, keep disabled.
	if custom_endpoint_url:
	os.environ['USE_CUSTOM_OPENAI_ENDPOINT'] = '1'
	os.environ['OPENAI_CUSTOM_BASE_URL'] = custom_endpoint_url
	sys.stderr.write(f"[CONFIG] Custom OpenAI Endpoint enabled: {custom_endpoint_url}\n")
	else:
	os.environ['USE_CUSTOM_OPENAI_ENDPOINT'] = '0'
	os.environ['OPENAI_CUSTOM_BASE_URL'] = ''

	# Set model and API key
	os.environ['MODEL'] = model
	os.environ['GLOSSARY_SYSTEM_PROMPT'] = glossary_prompt

	# Set translation parameters (same as /translate)
	os.environ['BATCH_TRANSLATION'] = '1'
	os.environ['BATCH_SIZE'] = str(batch_size)
	os.environ['MAX_OUTPUT_TOKENS'] = str(max_output_tokens)
	os.environ['GLOSSARY_TEMPERATURE'] = str(temperature)
	os.environ['TRANSLATION_TEMPERATURE'] = str(temperature)
	os.environ['GLOSSARY_MAX_OUTPUT_TOKENS'] = str(max_output_tokens)
	# Preserve markdown/structure and force BeautifulSoup for traditional APIs (from Other Settings)
	os.environ['ENHANCED_PRESERVE_STRUCTURE'] = '1' if config.get('enhanced_preserve_structure', True) else '0'
	os.environ['FORCE_BS_FOR_TRADITIONAL'] = '1' if config.get('force_bs_for_traditional', False) else '0'

	# Set extraction mode
	os.environ['TEXT_EXTRACTION_METHOD'] = extraction_mode
	if extraction_mode == 'enhanced':
	os.environ['EXTRACTION_MODE'] = 'enhanced'
	os.environ['ENHANCED_FILTERING'] = 'smart'
	os.environ['ENHANCED_PRESERVE_STRUCTURE'] = '1'
	else:
	os.environ['EXTRACTION_MODE'] = 'smart'
	os.environ['FILE_FILTERING_LEVEL'] = 'smart'

	# Set PDF-specific styling extraction variables from pdf_extractor
	# These ensure PDF font sizes, alignments, and styles are preserved
	if filename.endswith('.pdf'):
	sys.stderr.write(f"[CONFIG] Enabling PDF formatting extraction (font size, alignment, etc.)\n")
	sys.stderr.flush()
	# Force XHTML render mode for better PDF extraction quality
	os.environ['PDF_RENDER_MODE'] = 'xhtml'
	sys.stderr.write(f"[CONFIG] Using XHTML render mode for PDF\n")
	sys.stderr.flush()
	# The pdf_extractor.generate_css_from_pdf() function will automatically
	# detect and apply: base_font_size, font_family, text_align, line_height_ratio
	# from the actual PDF file during processing

	# Set all glossary variables from config (same as /translate)
	os.environ['ENABLE_AUTO_GLOSSARY'] = '1'
	os.environ['GLOSSARY_MIN_FREQUENCY'] = str(config.get('glossary_min_frequency', 2))
	os.environ['GLOSSARY_MAX_NAMES'] = str(config.get('glossary_max_names', 50))
	os.environ['GLOSSARY_MAX_TITLES'] = str(config.get('glossary_max_titles', 30))
	os.environ['GLOSSARY_COMPRESSION_FACTOR'] = str(glossary_compression_factor)
	os.environ['GLOSSARY_FILTER_MODE'] = config.get('glossary_filter_mode', 'all')
	os.environ['GLOSSARY_STRIP_HONORIFICS'] = '1' if config.get('glossary_strip_honorifics', True) else '0'
	os.environ['GLOSSARY_FUZZY_THRESHOLD'] = str(config.get('glossary_fuzzy_threshold', 0.90))
	os.environ['GLOSSARY_MAX_TEXT_SIZE'] = str(config.get('glossary_max_text_size', 50000))
	# Cap glossary max sentences for the Discord bot to keep prompts small/predictable.
	# (GlossaryManager reads this via GLOSSARY_MAX_SENTENCES)
	os.environ['GLOSSARY_MAX_SENTENCES'] = '200'
	os.environ['GLOSSARY_CHAPTER_SPLIT_THRESHOLD'] = str(config.get('glossary_chapter_split_threshold', 50000))
	os.environ['GLOSSARY_SKIP_FREQUENCY_CHECK'] = '0'
	os.environ['CONTEXT_WINDOW_SIZE'] = str(config.get('glossary_context_window', 2))
	os.environ['GLOSSARY_CONTEXT_LIMIT'] = str(config.get('manual_context_limit', 2))
	os.environ['GLOSSARY_USE_LEGACY_CSV'] = '0'
	os.environ['GLOSSARY_DUPLICATE_KEY_MODE'] = 'skip'
	os.environ['GLOSSARY_DISABLE_HONORIFICS_FILTER'] = '1' if config.get('glossary_disable_honorifics_filter', False) else '0'
	# Ensure glossary output language matches the command's target_language
	os.environ['GLOSSARY_TARGET_LANGUAGE'] = target_language
	os.environ['OUTPUT_LANGUAGE'] = target_language
	# Align throttling/timeouts with config defaults (matches GUI behavior)
	os.environ['SEND_INTERVAL_SECONDS'] = str(config.get('delay', 2.0))
	os.environ['THREAD_SUBMISSION_DELAY_SECONDS'] = str(config.get('thread_submission_delay', 0.5))
	os.environ['RETRY_TIMEOUT'] = '1' if config.get('retry_timeout', False) else '0'
	os.environ['CHUNK_TIMEOUT'] = str(config.get('chunk_timeout', 1800))
	os.environ['ENABLE_HTTP_TUNING'] = '1' if config.get('enable_http_tuning', False) else '0'
	os.environ['CONNECT_TIMEOUT'] = str(config.get('connect_timeout', 10))
	# Don't set READ_TIMEOUT for the bot; chunk timeout is the single source of truth.
	os.environ.pop('READ_TIMEOUT', None)
	os.environ['HTTP_POOL_CONNECTIONS'] = str(config.get('http_pool_connections', 20))
	os.environ['HTTP_POOL_MAXSIZE'] = str(config.get('http_pool_maxsize', 50))
	os.environ['IGNORE_RETRY_AFTER'] = '1' if config.get('ignore_retry_after', False) else '0'
	# Cap retries for the Discord bot to keep runs predictable.
	os.environ['MAX_RETRIES'] = '3'

	# Glossary request merging settings
	# Single source of truth: merge_count
	if merge_count is None:
	# If omitted, keep merging disabled
	glossary_request_merging_enabled = False
	glossary_request_merge_count_raw = 1
	else:
	glossary_request_merge_count_raw = int(merge_count)
	glossary_request_merging_enabled = glossary_request_merge_count_raw >= 2

	# Keep the count safe for downstream code (even when disabled)
	glossary_request_merge_count_effective = max(1, glossary_request_merge_count_raw)

	os.environ['GLOSSARY_REQUEST_MERGING_ENABLED'] = '1' if glossary_request_merging_enabled else '0'
	os.environ['GLOSSARY_REQUEST_MERGE_COUNT'] = str(glossary_request_merge_count_effective)
	os.environ['GLOSSARY_DUPLICATE_ALGORITHM'] = duplicate_algorithm
	# Use config defaults for gender context and description (manual glossary extraction)
	os.environ['GLOSSARY_INCLUDE_GENDER_CONTEXT'] = '1' if config.get('include_gender_context', True) else '0'
	os.environ['GLOSSARY_INCLUDE_DESCRIPTION'] = '1' if config.get('include_description', True) else '0'
	# Custom glossary fields (additional columns) - default to ['description']
	custom_fields = config.get('custom_glossary_fields', [])
	if not custom_fields and not config.get('custom_field_description_removed', False):
	custom_fields = ['description']
	os.environ['GLOSSARY_CUSTOM_FIELDS'] = json.dumps(custom_fields)
	os.environ['DISABLE_GEMINI_SAFETY'] = 'true'

	# Handle Thinking Toggle
	if not thinking:
	os.environ['ENABLE_GPT_THINKING'] = '0'
	os.environ['ENABLE_GEMINI_THINKING'] = '0'
	os.environ['ENABLE_DEEPSEEK_THINKING'] = '0'
	os.environ.pop('GPT_REASONING_TOKENS', None)
	sys.stderr.write(f"[CONFIG] Thinking capabilities disabled via command\n")
	else:
	# Set specific thinking variables if thinking is enabled
	os.environ['GEMINI_THINKING_LEVEL'] = gemini_thinking_level
	os.environ['THINKING_BUDGET'] = str(gemini_thinking_budget)
	os.environ['GPT_EFFORT'] = gpt_effort

	# Handle Vertex AI / Google Cloud credentials
	if '@' in model or model.startswith('vertex/'):
	# Prefer an uploaded credentials file; otherwise fall back to config.json.
	google_creds = None
	if google_credentials_file is not None:
	creds_name = os.path.basename(getattr(google_credentials_file, 'filename', '') or 'google_credentials.json')
	if not creds_name.lower().endswith('.json'):
	creds_name = 'google_credentials.json'
	google_creds = os.path.join(temp_dir, creds_name)
	try:
	await google_credentials_file.save(google_creds)
	except Exception as e:
	sys.stderr.write(f"[CONFIG] Failed to save uploaded Google credentials: {e}\n")
	google_creds = None

	if google_creds is None:
	google_creds = config.get('google_cloud_credentials')

	if google_creds and os.path.exists(google_creds):
	os.environ['GOOGLE_APPLICATION_CREDENTIALS'] = google_creds
	sys.stderr.write(f"[CONFIG] Using Google Cloud credentials: {os.path.basename(google_creds)}\n")
	sys.stderr.flush()

	try:
	with open(google_creds, 'r', encoding='utf-8') as f:
	creds_data = json.load(f)
	project_id = creds_data.get('project_id', 'vertex-ai-project')
	os.environ['GOOGLE_CLOUD_PROJECT'] = project_id
	if not api_key:
	api_key = project_id
	except Exception:
	pass

	# Set API key
	os.environ['API_KEY'] = api_key
	os.environ['OPENAI_API_KEY'] = api_key
	os.environ['OPENAI_OR_Gemini_API_KEY'] = api_key

	if 'claude' in model.lower():
	os.environ['ANTHROPIC_API_KEY'] = api_key
	elif 'gemini' in model.lower():
	os.environ['GOOGLE_API_KEY'] = api_key
	os.environ['GEMINI_API_KEY'] = api_key

	# Initialize extraction state
	user_id = interaction.user.id
	translation_states[user_id] = {
	'logs': [],
	'show_full': False,
	'stop_requested': False,
	'last_update': 0,
	'pending_update': False
	}
	state = translation_states[user_id]

	def log_callback(msg):
	if msg and msg.strip():
	state['logs'].append(msg.strip())
	sys.stderr.write(f"[LOG] {msg.strip()}\n")
	sys.stderr.flush()

	import time
	current_time = time.time()
	if current_time - state['last_update'] >= 1.0:
	state['last_update'] = current_time
	state['pending_update'] = False
	asyncio.run_coroutine_threadsafe(update_progress(), bot.loop)
	else:
	state['pending_update'] = True

	def stop_callback():
	return state['stop_requested']

	async def periodic_update_check():
	import time
	while user_id in translation_states and not state['stop_requested']:
	await asyncio.sleep(1)
	if state.get('pending_update', False):
	state['pending_update'] = False
	state['last_update'] = time.time()
	await update_progress()

	async def update_progress():
	try:
	logs = state['logs']
	if state['show_full']:
	log_text = '\n'.join(logs)
	if len(log_text) > 3900:
	log_text = "..." + log_text[-3900:]
	else:
	log_text = '\n'.join(logs[-10:])
	if len(log_text) > 800:
	log_text = log_text[-800:]

	if not log_text:
	log_text = "Starting..."

	embed = discord.Embed(
	title="📚 Glossary Extraction in Progress",
	description=f"Status: Processing... ({len(logs)} logs)\n\n```{log_text}```",
	color=discord.Color.blue()
	)

	view = LogView(user_id)
	await message.edit(embed=embed, view=view)
	except Exception as e:
	sys.stderr.write(f"[ERROR] Failed to update progress: {e}\n")
	sys.stderr.flush()

	await update_progress()
	update_task = asyncio.create_task(periodic_update_check())

	def run_extraction():
	_ensure_stable_cwd()

	sys.stderr.write(f"[EXTRACT] Starting glossary extraction for: {input_path}\\n")
	sys.stderr.write(f"[EXTRACT] Temp directory: {temp_dir}\\n")
	sys.stderr.flush()

	# Defensive checks: if these fail, raise an explicit error instead of a generic Errno 2.
	if not os.path.isdir(temp_dir):
	raise FileNotFoundError(f"Temp directory does not exist: {temp_dir}")
	if not os.path.isfile(input_path):
	raise FileNotFoundError(f"Input file does not exist: {input_path}")

	# Avoid chdir() to eliminate CWD-dependent bugs and races.
	# Use absolute output/config paths so the extractor is deterministic.
	output_base = os.path.splitext(os.path.basename(filename))[0] or "glossary"
	output_path = os.path.join(temp_dir, f"{output_base}_glossary.json")

	# Bot-only deployments often don't ship a config.json (it's gitignored).
	# The extractor currently expects a file path, so if one isn't present,
	# create a minimal config in the temp dir and rely on env vars (API_KEY, MODEL, etc.).
	config_path = CONFIG_FILE
	if not os.path.exists(config_path):
	config_path = os.path.join(temp_dir, "config.json")
	try:
	if not os.path.exists(config_path):
	with open(config_path, "w", encoding="utf-8") as f:
	json.dump({}, f)
	except Exception as e:
	# If we can't write a temp config for any reason, fall back to the original path
	# so the error message is explicit.
	sys.stderr.write(f"[EXTRACT] Failed to create temp config.json: {e}\n")
	sys.stderr.flush()
	config_path = CONFIG_FILE

	original_argv = sys.argv[:]
	try:
	sys.argv = [
	'extract_glossary_from_epub.py',
	'--epub', input_path,
	'--output', output_path,
	'--config', config_path
	]

	glossary_main(log_callback=log_callback, stop_callback=stop_callback)

	sys.stderr.write(f"[EXTRACT] Glossary extraction completed\n")
	sys.stderr.flush()
	return output_path
	finally:
	# Prevent leaking argv changes across commands.
	sys.argv = original_argv

	loop = asyncio.get_event_loop()
	extraction_future = loop.run_in_executor(None, run_extraction)
	output_filename = await extraction_future

	update_task.cancel()
	try:
	await update_task
	except asyncio.CancelledError:
	pass

	if state['stop_requested']:
	embed = discord.Embed(
	title="⏹️ Extraction Stopped",
	description="Glossary extraction was stopped by user.",
	color=discord.Color.orange()
	)
	await message.edit(embed=embed, view=None)
	return

	# Prefer the explicit output path returned by the extractor thread.
	# This avoids brittle "find the right file" scanning.
	output_file_path = None
	output_display_name = None
	is_zip_output = False

	try:
	if output_filename and os.path.isfile(output_filename):
	output_file_path = output_filename
	output_display_name = os.path.basename(output_filename)
	except Exception:
	pass

	glossary_dir = os.path.join(temp_dir, 'Glossary')

	# If a ZIP was requested, prefer zipping the Glossary directory if present;
	# otherwise, zip whatever single output file we produced.
	if send_zip:
	is_zip_output = True
	output_base = os.path.splitext(os.path.basename(filename))[0] or "glossary"
	zip_filename = f"{output_base}_glossary.zip"
	zip_path = os.path.join(temp_dir, zip_filename)

	import zipfile
	with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zipf:
	if os.path.exists(glossary_dir) and os.path.isdir(glossary_dir):
	for root, dirs, files in os.walk(glossary_dir):
	for file_item in files:
	file_path = os.path.join(root, file_item)
	arcname = os.path.relpath(file_path, glossary_dir)
	zipf.write(file_path, arcname)
	elif output_file_path and os.path.exists(output_file_path):
	zipf.write(output_file_path, os.path.basename(output_file_path))

	output_file_path = zip_path
	output_display_name = zip_filename

	# Legacy fallback: if we didn't get an explicit output file, try the historical Glossary/ folder.
	if not output_file_path:
	if os.path.exists(glossary_dir) and os.path.isdir(glossary_dir):
	for f in os.listdir(glossary_dir):
	if f.endswith('.csv'):
	output_file_path = os.path.join(glossary_dir, f)
	output_display_name = f
	break

	async def _dm_or_channel(content: str = None, embed: Optional[discord.Embed] = None, file: Optional[discord.File] = None):
	try:
	await interaction.user.send(content=content, embed=embed, file=file)
	return True
	except discord.Forbidden:
	try:
	await interaction.channel.send(content=content, embed=embed, file=file)
	return True
	except Exception:
	return False
	except Exception:
	return False

	# Send output
	if output_file_path and os.path.exists(output_file_path):
	file_size = os.path.getsize(output_file_path)

	if _should_offload(file_size, send_zip):
	loop = asyncio.get_event_loop()
	download_url = None
	for uploader, name in (( _upload_to_tempsh, "temp.sh"), (_upload_to_tmpfiles, "tmpfiles"), (_upload_to_oracle_par, "oracle"), (_upload_to_gofile, "gofile")):
	try:
	download_url = await loop.run_in_executor(
	None,
	functools.partial(uploader, output_file_path, output_display_name),
	)
	break
	except Exception as e2:
	sys.stderr.write(f"[HOST ERROR] {name}: {e2}\n")
	continue
	if download_url:
	embed = discord.Embed(
	title="✅ Glossary Extraction Complete!",
	description=(
	f"File: {output_display_name}\\n"
	f"Size: {file_size / 1024 / 1024:.2f}MB\\n"
	f"Download: <{download_url}>"
	),
	color=discord.Color.green()
	)
	await _dm_or_channel(embed=embed)
	else:
	await _dm_or_channel(
	content="Could not upload the glossary output right now. Please try again later."
	)
	else:
	embed = discord.Embed(
	title="✅ Glossary Extraction Complete!",
	description=f"File: {output_display_name}\nSize: {file_size / 1024:.2f}KB",
	color=discord.Color.green()
	)
	await _dm_or_channel(embed=embed)

	try:
	await _dm_or_channel(
	content=f"Here's your extracted glossary{(' (zipped)' if is_zip_output else '')}!",
	file=discord.File(output_file_path, filename=output_display_name),
	)
	except Exception:
	try:
	loop = asyncio.get_event_loop()
	download_url = await loop.run_in_executor(
	None,
	functools.partial(_upload_to_gofile, output_file_path, output_display_name),
	)
	await _dm_or_channel(
	content=f"Download: {download_url}",
	)
	except Exception:
	await _dm_or_channel(
	content="Upload failed and Gofile is unavailable right now."
	)
	else:
	embed = discord.Embed(
	title="❌ Extraction Failed",
	description="Could not find or prepare glossary output file",
	color=discord.Color.red()
	)
	await _dm_or_channel(embed=embed)

	except Exception as e:
	import traceback
	error = f"```\n{traceback.format_exc()[-1000:]}\n```"
	embed = discord.Embed(
	title="❌ Error",
	description=f"{str(e)}\n{error}",
	color=discord.Color.red()
	)
	await message.edit(embed=embed, view=None)

	finally:
	# Ensure the background extraction thread has finished before removing temp_dir.
	# If we delete early, the executor thread can crash with FileNotFoundError.
	try:
	if 'state' in locals():
	state['stop_requested'] = True
	except Exception:
	pass

	try:
	if 'update_task' in locals() and update_task:
	update_task.cancel()
	except Exception:
	pass

	try:
	if 'extraction_future' in locals() and extraction_future and not extraction_future.done():
	try:
	await asyncio.wait_for(extraction_future, timeout=10)
	except Exception:
	# If it doesn't finish quickly, don't delete the directory out from under it.
	pass
	except Exception:
	pass

	if user_id in translation_states:
	del translation_states[user_id]

	try:
	if os.path.exists(temp_dir):
	shutil.rmtree(temp_dir)
	except Exception:
	pass


	@bot.tree.command(name="models", description="List available AI models")
	async def models(interaction: discord.Interaction):
	    """Reply with an embed of the available models, grouped by name prefix.

	    Models come from ``get_model_options()`` and are grouped by the text
	    before their first ``-`` (the whole name when there is no ``-``). At most
	    10 groups are shown, each listing up to 5 models followed by a
	    "+N more" line when the group is larger. When ``GLOSSARION_AVAILABLE`` is
	    falsy, a short "not available" message is sent instead.
	    """
	    if not GLOSSARION_AVAILABLE:
	        await _safe_send_message(interaction, "❌ Not available", ephemeral=_ephemeral(interaction))
	        return

	    # Bucket every model under its prefix, keeping first-seen order.
	    grouped = {}
	    for model_name in get_model_options():
	        prefix = model_name.partition('-')[0]
	        grouped.setdefault(prefix, []).append(model_name)

	    embed = discord.Embed(
	        title="🤖 Available Models",
	        description="Use with `/translate`",
	        color=discord.Color.blue()
	    )

	    # Only the first 10 groups and the first 5 models per group are rendered.
	    for prefix, names in list(grouped.items())[:10]:
	        bullet_lines = [f"• `{name}`" for name in names[:5]]
	        hidden_count = len(names) - 5
	        if hidden_count > 0:
	            bullet_lines.append(f"• ... +{hidden_count} more")
	        embed.add_field(name=prefix.upper(), value='\n'.join(bullet_lines), inline=True)

	    await _safe_send_message(interaction, embed=embed, ephemeral=_ephemeral(interaction))


	@bot.tree.command(name="help", description="Show help")
	async def help_command(interaction: discord.Interaction):
	    """Reply with an embed summarising the bot's commands and usage notes.

	    The embed has three fields: the command list, a ``/translate`` example,
	    and general notes. It is sent through ``_safe_send_message`` with the
	    ephemeral flag taken from ``_ephemeral(interaction)``.
	    """
	    embed = discord.Embed(
	        title="📚 Glossarion Discord Bot",
	        description="Translate EPUB/TXT files using AI",
	        color=discord.Color.blue()
	    )

	    embed.add_field(
	        name="Commands",
	        value="`/save` - Store encrypted API key/model\n`/translate` - Translate file\n`/extract` - Extract glossary\n`/models` - List models\n`/help` - This message\n\nUse `send_zip: True` to force ZIP output.",
	        inline=False
	    )

	    embed.add_field(
	        name="Example",
	        value="```\n/translate\n file: novel.epub\n api_key: sk-...\n model: gpt-4\n target_language: English\n```",
	        inline=False
	    )

	    embed.add_field(
	        name="Notes",
	        value=(
	            "• Files over 25MB auto-hosted for 24h (shared 5GB cap)\n"
	            "• Uses your Glossarion config\n"
	            # The command list above advertises `/save` as storing an
	            # encrypted key, so a flat "API key not stored" contradicted it.
	            "• API key not stored unless saved with `/save` (encrypted)"
	        ),
	        inline=False
	    )

	    await _safe_send_message(interaction, embed=embed, ephemeral=_ephemeral(interaction))


	def main():
	    """Run the Discord bot using the token in ``DISCORD_BOT_TOKEN``.

	    When the environment variable is unset or empty, setup instructions are
	    printed and the function returns without starting the bot. Otherwise a
	    warning is printed if ``GLOSSARION_AVAILABLE`` is falsy, and ``bot.run``
	    is called with the token.
	    """
	    discord_token = os.environ.get('DISCORD_BOT_TOKEN')

	    if discord_token:
	        if not GLOSSARION_AVAILABLE:
	            print("⚠️ Glossarion not available - translations will fail")

	        print("🚀 Starting Glossarion Discord Bot...")
	        bot.run(discord_token)
	        return

	    # No token: explain how to configure one, one line per print call.
	    setup_instructions = (
	        "❌ DISCORD_BOT_TOKEN not set!",
	        "\nSetup:",
	        "1. Create bot at https://discord.com/developers/applications",
	        "2. Get token from Bot section",
	        "3. Set environment variable:",
	        " Windows: set DISCORD_BOT_TOKEN=your_token",
	        " Linux/Mac: export DISCORD_BOT_TOKEN=your_token",
	        "4. Invite bot with 'bot' + 'applications.commands' scopes",
	    )
	    for instruction in setup_instructions:
	        print(instruction)


	# Script entry point: only when this file is executed directly, import
	# run_cli_main from shutdown_utils and hand it main instead of calling
	# main() here.
	# NOTE(review): presumably run_cli_main wraps main() with shutdown/interrupt
	# handling — confirm in shutdown_utils.
	if __name__ == "__main__":
	from shutdown_utils import run_cli_main
	run_cli_main(main)