Spaces:
Paused
Paused
| import base64 | |
| import hashlib | |
| import os | |
| import re | |
| import shutil | |
| import threading | |
| import time | |
| from concurrent.futures import ThreadPoolExecutor, as_completed | |
| from typing import Optional | |
| from collections import OrderedDict | |
| import cv2 | |
| import numpy as np | |
| from PIL import Image | |
| try: | |
| import boto3 | |
| from botocore.exceptions import BotoCoreError, ClientError | |
| except ImportError: | |
| boto3 = None | |
| BotoCoreError = ClientError = Exception | |
| from config import ( | |
| IMAGES_DIR, | |
| logger, | |
| SAVE_QUALITY, | |
| MODELS_PATH, | |
| BOS_ACCESS_KEY, | |
| BOS_SECRET_KEY, | |
| BOS_ENDPOINT, | |
| BOS_BUCKET_NAME, | |
| BOS_IMAGE_DIR, | |
| BOS_UPLOAD_ENABLED, | |
| BOS_DOWNLOAD_TARGETS, | |
| HUGGINGFACE_REPO_ID, | |
| HUGGINGFACE_SYNC_ENABLED, | |
| HUGGINGFACE_REVISION, | |
| HUGGINGFACE_ALLOW_PATTERNS, | |
| HUGGINGFACE_IGNORE_PATTERNS, | |
| ) | |
# --- BOS client singleton state (initialization guarded by _BOS_CLIENT_LOCK) ---
_BOS_CLIENT = None  # cached boto3 S3 client, or None when unavailable
_BOS_CLIENT_INITIALIZED = False  # True once client initialization has been attempted
_BOS_CLIENT_LOCK = threading.Lock()
# --- one-shot resource download state (guarded by _BOS_DOWNLOAD_LOCK) ---
_BOS_DOWNLOAD_LOCK = threading.Lock()
_BOS_DOWNLOAD_COMPLETED = False  # set once all blocking BOS targets synced
# Lazily created executor for background sync jobs, plus their pending futures.
_BOS_BACKGROUND_EXECUTOR = None
_BOS_BACKGROUND_FUTURES = []
# Absolute images directory; uploads are restricted to files under this path.
_IMAGES_DIR_ABS = os.path.abspath(os.path.expanduser(IMAGES_DIR))
# LRU cache of completed uploads: (path, object_key) -> (mtime_ns, size).
_BOS_UPLOAD_CACHE = OrderedDict()
_BOS_UPLOAD_CACHE_LOCK = threading.Lock()
_BOS_UPLOAD_CACHE_MAX = 2048
| def _decode_bos_credential(raw_value: str) -> str: | |
| """将Base64编码的凭证解码为明文,若解码失败则返回原值""" | |
| if not raw_value: | |
| return "" | |
| value = raw_value.strip() | |
| if not value: | |
| return "" | |
| try: | |
| padding = len(value) % 4 | |
| if padding: | |
| value += "=" * (4 - padding) | |
| decoded = base64.b64decode(value).decode("utf-8").strip() | |
| if decoded: | |
| return decoded | |
| except Exception: | |
| pass | |
| return value | |
def _is_path_under_images_dir(file_path: str) -> bool:
    """Return True when *file_path* resolves to a location inside IMAGES_DIR."""
    candidate = os.path.abspath(file_path)
    try:
        common = os.path.commonpath([_IMAGES_DIR_ABS, candidate])
    except ValueError:
        # Raised for mixed drives (Windows) or mixed absolute/relative inputs.
        return False
    return common == _IMAGES_DIR_ABS
def _get_bos_client():
    """Lazily create and cache the boto3 S3 client for BOS.

    Uses double-checked locking so initialization is attempted at most once
    per process. Returns the shared client, or None when uploads are
    disabled, the configuration is incomplete, boto3 is missing, or
    initialization failed.
    """
    global _BOS_CLIENT, _BOS_CLIENT_INITIALIZED
    # Fast path: initialization already attempted; return the cached result.
    if _BOS_CLIENT_INITIALIZED:
        return _BOS_CLIENT
    with _BOS_CLIENT_LOCK:
        # Re-check under the lock in case another thread initialized first.
        if _BOS_CLIENT_INITIALIZED:
            return _BOS_CLIENT
        if not BOS_UPLOAD_ENABLED:
            _BOS_CLIENT_INITIALIZED = True
            _BOS_CLIENT = None
            return None
        access_key = _decode_bos_credential(BOS_ACCESS_KEY)
        secret_key = _decode_bos_credential(BOS_SECRET_KEY)
        if not all([access_key, secret_key, BOS_ENDPOINT, BOS_BUCKET_NAME]):
            logger.warning("BOS 上传未配置完整,跳过初始化")
            _BOS_CLIENT_INITIALIZED = True
            _BOS_CLIENT = None
            return None
        if boto3 is None:
            logger.warning("未安装 boto3,BOS 上传功能不可用")
            _BOS_CLIENT_INITIALIZED = True
            _BOS_CLIENT = None
            return None
        try:
            _BOS_CLIENT = boto3.client(
                "s3",
                aws_access_key_id=access_key,
                aws_secret_access_key=secret_key,
                endpoint_url=BOS_ENDPOINT,
            )
            logger.info("BOS 客户端初始化成功")
        except Exception as e:
            logger.warning(f"初始化 BOS 客户端失败,将跳过上传: {e}")
            _BOS_CLIENT = None
        finally:
            # Mark as initialized even on failure so every call doesn't retry.
            _BOS_CLIENT_INITIALIZED = True
    return _BOS_CLIENT
| def _normalize_bos_prefix(prefix: Optional[str]) -> str: | |
| value = (prefix or "").strip() | |
| if not value: | |
| return "" | |
| value = value.strip("/") | |
| if not value: | |
| return "" | |
| return f"{value}/" if not value.endswith("/") else value | |
| def _directory_has_files(path: str) -> bool: | |
| try: | |
| for _root, _dirs, files in os.walk(path): | |
| if files: | |
| return True | |
| except Exception: | |
| return False | |
| return False | |
def download_bos_directory(prefix: str, destination_dir: str, *, force_download: bool = False) -> bool:
    """
    Sync a prefixed "directory" of BOS objects down to a local directory.

    :param prefix: BOS object prefix, e.g. 'models/' or '20220620/models'
    :param destination_dir: local destination directory
    :param force_download: re-download even when local files already exist
    :return: whether the directory contents are available locally
    """
    client = _get_bos_client()
    if client is None:
        logger.warning("BOS 客户端不可用,无法下载资源(prefix=%s)", prefix)
        return False
    dest_dir = os.path.abspath(os.path.expanduser(destination_dir))
    try:
        os.makedirs(dest_dir, exist_ok=True)
    except Exception as exc:
        logger.error("创建本地目录失败: %s (%s)", dest_dir, exc)
        return False
    normalized_prefix = _normalize_bos_prefix(prefix)
    # When not forcing and the destination already has files, skip entirely to
    # avoid re-downloading on every startup.
    if not force_download and _directory_has_files(dest_dir):
        logger.info("本地目录已存在文件,跳过下载: %s -> %s", normalized_prefix or "<root>", dest_dir)
        return True
    paginate_kwargs = {"Bucket": BOS_BUCKET_NAME}
    if normalized_prefix:
        paginate_kwargs["Prefix"] = normalized_prefix if normalized_prefix.endswith("/") else f"{normalized_prefix}/"
    found_any = False
    downloaded = 0
    skipped = 0
    try:
        paginator = client.get_paginator("list_objects_v2")
        for page in paginator.paginate(**paginate_kwargs):
            for obj in page.get("Contents", []):
                key = obj.get("Key")
                if not key:
                    continue
                if normalized_prefix:
                    prefix_with_slash = normalized_prefix if normalized_prefix.endswith("/") else f"{normalized_prefix}/"
                    if not key.startswith(prefix_with_slash):
                        continue
                    relative_key = key[len(prefix_with_slash):]
                else:
                    relative_key = key
                # Skip "directory placeholder" keys and the prefix entry itself.
                if not relative_key or relative_key.endswith("/"):
                    continue
                found_any = True
                target_path = os.path.join(dest_dir, relative_key)
                target_dir = os.path.dirname(target_path)
                os.makedirs(target_dir, exist_ok=True)
                expected_size = obj.get("Size")
                # An existing local file with a matching size counts as current.
                if (
                    not force_download
                    and os.path.exists(target_path)
                    and expected_size is not None
                    and expected_size == os.path.getsize(target_path)
                ):
                    skipped += 1
                    logger.info("文件已存在且大小一致,跳过下载: %s", relative_key)
                    continue
                # Download to a temp file, then atomically replace the target so a
                # failed transfer never leaves a truncated file behind.
                tmp_path = f"{target_path}.download"
                try:
                    size_mb = (expected_size or 0) / (1024 * 1024)
                    logger.info("开始下载: %s (%.2f MB)", relative_key, size_mb)
                    client.download_file(Bucket=BOS_BUCKET_NAME, Key=key, Filename=tmp_path)
                    os.replace(tmp_path, target_path)
                    downloaded += 1
                    logger.info("下载完成: %s", relative_key)
                except Exception as exc:
                    # Per-object failures are logged and the loop continues.
                    logger.warning("下载失败: %s (%s)", key, exc)
                    try:
                        if os.path.exists(tmp_path):
                            os.remove(tmp_path)
                    except Exception:
                        pass
    except Exception as exc:
        logger.warning("遍历 BOS 目录失败: %s", exc)
        return False
    if not found_any:
        logger.warning("在 BOS 桶 %s 中未找到前缀 '%s' 的内容", BOS_BUCKET_NAME, normalized_prefix or "<root>")
        return False
    logger.info(
        "BOS 同步完成 prefix=%s -> %s 下载=%d 跳过=%d",
        normalized_prefix or "<root>",
        dest_dir,
        downloaded,
        skipped,
    )
    # True only when at least one object was downloaded or verified present.
    return downloaded > 0 or skipped > 0
def _get_background_executor() -> ThreadPoolExecutor:
    """Return the lazily-created shared executor for background BOS sync jobs.

    NOTE(review): creation is not lock-guarded, so two threads racing here
    could each build an executor. The only visible caller invokes this while
    holding _BOS_DOWNLOAD_LOCK, which appears to serialize it — confirm.
    """
    global _BOS_BACKGROUND_EXECUTOR
    if _BOS_BACKGROUND_EXECUTOR is None:
        _BOS_BACKGROUND_EXECUTOR = ThreadPoolExecutor(max_workers=2, thread_name_prefix="bos-bg")
    return _BOS_BACKGROUND_EXECUTOR
def ensure_huggingface_models(force_download: bool = False) -> bool:
    """Sync the configured HuggingFace model repository into MODELS_PATH.

    Returns True when syncing is disabled/unconfigured or completed
    successfully; False on any failure (missing dependency, directory
    creation error, or download error).
    """
    if not HUGGINGFACE_SYNC_ENABLED:
        logger.info("HuggingFace 模型同步开关已关闭,跳过同步流程")
        return True
    repo_id = (HUGGINGFACE_REPO_ID or "").strip()
    if not repo_id:
        logger.info("未配置 HuggingFace 仓库,跳过模型下载")
        return True
    try:
        from huggingface_hub import snapshot_download
    except ImportError:
        logger.error("未安装 huggingface-hub,无法下载 HuggingFace 模型")
        return False
    try:
        os.makedirs(MODELS_PATH, exist_ok=True)
    except Exception as exc:
        logger.error("创建模型目录失败: %s (%s)", MODELS_PATH, exc)
        return False
    revision = (HUGGINGFACE_REVISION or "").strip()
    # Assemble snapshot_download arguments from the optional config knobs.
    kwargs = {
        "repo_id": repo_id,
        "local_dir": MODELS_PATH,
        "local_dir_use_symlinks": False,
        # Forced downloads start fresh; otherwise resume partial transfers.
        "resume_download": not force_download,
    }
    if revision:
        kwargs["revision"] = revision
    if HUGGINGFACE_ALLOW_PATTERNS:
        kwargs["allow_patterns"] = HUGGINGFACE_ALLOW_PATTERNS
    if HUGGINGFACE_IGNORE_PATTERNS:
        kwargs["ignore_patterns"] = HUGGINGFACE_IGNORE_PATTERNS
    if force_download:
        kwargs["force_download"] = True
    try:
        logger.info(
            "开始同步 HuggingFace 模型: repo=%s revision=%s -> %s",
            repo_id,
            revision or "<default>",
            MODELS_PATH,
        )
        snapshot_path = snapshot_download(**kwargs)
        logger.info(
            "HuggingFace 模型同步完成: %s -> %s",
            repo_id,
            snapshot_path,
        )
        return True
    except Exception as exc:
        logger.error("HuggingFace 模型下载失败: %s", exc)
        return False
def ensure_bos_resources(force_download: bool = False, include_background: bool = False) -> bool:
    """
    Sync the startup model/data resources configured in BOS_DOWNLOAD_TARGETS.

    :param force_download: force re-sync of every resource
    :param include_background: run background-flagged targets as blocking jobs too
    :return: whether all blocking resources are ready
    """
    global _BOS_DOWNLOAD_COMPLETED, _BOS_BACKGROUND_FUTURES
    with _BOS_DOWNLOAD_LOCK:
        # Fast path: a prior sync already completed and nothing more is asked.
        if _BOS_DOWNLOAD_COMPLETED and not force_download and not include_background:
            return True
        targets = BOS_DOWNLOAD_TARGETS or []
        if not targets:
            logger.info("未配置 BOS 下载目标,跳过资源同步")
            _BOS_DOWNLOAD_COMPLETED = True
            return True
        # Validate each configured target and split into blocking vs background.
        download_jobs = []
        background_jobs = []
        for target in targets:
            if not isinstance(target, dict):
                logger.warning("无效的 BOS 下载配置项: %r", target)
                continue
            prefix = target.get("bos_prefix")
            destination = target.get("destination")
            description = target.get("description") or prefix or "<unnamed>"
            background_flag = bool(target.get("background"))
            if not prefix or not destination:
                logger.warning("缺少必要字段,无法处理 BOS 下载配置: %r", target)
                continue
            job = {
                "description": description,
                "prefix": prefix,
                "destination": destination,
            }
            if background_flag and not include_background:
                background_jobs.append(job)
            else:
                download_jobs.append(job)
        results = []
        if download_jobs:
            # Blocking jobs fan out over a transient pool sized by job count/CPUs.
            max_workers = min(len(download_jobs), max(os.cpu_count() or 1, 1))
            if max_workers <= 0:
                max_workers = 1
            with ThreadPoolExecutor(max_workers=max_workers, thread_name_prefix="bos-sync") as executor:
                future_to_job = {}
                for job in download_jobs:
                    logger.info(
                        "准备同步 BOS 资源: %s (prefix=%s -> %s)",
                        job["description"],
                        job["prefix"],
                        job["destination"],
                    )
                    future = executor.submit(
                        download_bos_directory,
                        job["prefix"],
                        job["destination"],
                        force_download=force_download,
                    )
                    future_to_job[future] = job
                for future in as_completed(future_to_job):
                    job = future_to_job[future]
                    description = job["description"]
                    try:
                        success = future.result()
                    except Exception as exc:
                        logger.warning("BOS 资源同步异常: %s (%s)", description, exc)
                        success = False
                    if success:
                        logger.info("BOS 资源已就绪: %s", description)
                    else:
                        logger.warning("BOS 资源同步失败: %s", description)
                    results.append(success)
        # With no blocking jobs at all, the blocking set is trivially "ready".
        all_ready = all(results) if results else True
        if all_ready:
            _BOS_DOWNLOAD_COMPLETED = True
        if background_jobs:
            executor = _get_background_executor()

            def _make_callback(description: str):
                # Build a done-callback that logs the outcome and removes the
                # future from the pending list.
                # NOTE(review): the callback re-acquires _BOS_DOWNLOAD_LOCK; if a
                # submitted future is already complete, add_done_callback runs the
                # callback on this thread while the (non-reentrant) lock is held —
                # confirm this cannot deadlock in practice.
                def _background_done(fut):
                    try:
                        success = fut.result()
                        if success:
                            logger.info("后台 BOS 资源已就绪: %s", description)
                        else:
                            logger.warning("后台 BOS 资源同步失败: %s", description)
                    except Exception as exc:
                        logger.warning("后台 BOS 资源同步异常: %s (%s)", description, exc)
                    finally:
                        with _BOS_DOWNLOAD_LOCK:
                            if fut in _BOS_BACKGROUND_FUTURES:
                                _BOS_BACKGROUND_FUTURES.remove(fut)
                return _background_done

            for job in background_jobs:
                logger.info(
                    "后台同步 BOS 资源: %s (prefix=%s -> %s)",
                    job["description"],
                    job["prefix"],
                    job["destination"],
                )
                future = executor.submit(
                    download_bos_directory,
                    job["prefix"],
                    job["destination"],
                    force_download=force_download,
                )
                future.add_done_callback(_make_callback(job["description"]))
                _BOS_BACKGROUND_FUTURES.append(future)
        return all_ready
def upload_file_to_bos(file_path: str, object_name: str | None = None) -> bool:
    """
    Synchronously upload a file to BOS; failures are logged, never raised.

    Only files under IMAGES_DIR are eligible, and an LRU cache keyed by
    (path, object key) with the file's (mtime_ns, size) signature skips
    re-uploading unchanged files.

    :param file_path: local file path
    :param object_name: BOS object name (optional; derived from the filename
        plus BOS_IMAGE_DIR when omitted)
    :return: whether the file was uploaded (or already known uploaded)
    """
    if not BOS_UPLOAD_ENABLED:
        return False
    start_time = time.perf_counter()
    expanded_path = os.path.abspath(os.path.expanduser(file_path))
    if not os.path.isfile(expanded_path):
        return False
    if not _is_path_under_images_dir(expanded_path):
        # Only upload files inside IMAGES_DIR, to avoid syncing temp files to BOS.
        return False
    try:
        file_stat = os.stat(expanded_path)
    except OSError:
        return False
    if _get_bos_client() is None:
        return False
    # Derive the object key.
    if object_name:
        object_key = object_name.strip("/ ")
    else:
        base_name = os.path.basename(expanded_path)
        if BOS_IMAGE_DIR:
            object_key = "/".join(
                part.strip("/ ") for part in (BOS_IMAGE_DIR, base_name) if part
            )
        else:
            object_key = base_name
    # (mtime_ns, size) identifies the file's content version for dedup caching.
    mtime_ns = getattr(file_stat, "st_mtime_ns", int(file_stat.st_mtime * 1_000_000_000))
    cache_signature = (mtime_ns, file_stat.st_size)
    cache_key = (expanded_path, object_key)
    with _BOS_UPLOAD_CACHE_LOCK:
        cached_signature = _BOS_UPLOAD_CACHE.get(cache_key)
        if cached_signature is not None:
            # Touch the entry (LRU), then skip if the file is unchanged.
            _BOS_UPLOAD_CACHE.move_to_end(cache_key)
            if cached_signature == cache_signature:
                elapsed_ms = (time.perf_counter() - start_time) * 1000
                logger.info("文件已同步至 BOS(跳过重复上传,耗时 %.1f ms): %s", elapsed_ms, object_key)
                return True

    def _do_upload(mode_label: str) -> bool:
        # Perform the actual transfer and record success in the LRU cache.
        client_inner = _get_bos_client()
        if client_inner is None:
            return False
        upload_start = time.perf_counter()
        try:
            client_inner.upload_file(expanded_path, BOS_BUCKET_NAME, object_key)
            elapsed_ms = (time.perf_counter() - upload_start) * 1000
            logger.info("文件已同步至 BOS(%s,耗时 %.1f ms): %s", mode_label, elapsed_ms, object_key)
            with _BOS_UPLOAD_CACHE_LOCK:
                _BOS_UPLOAD_CACHE[cache_key] = cache_signature
                _BOS_UPLOAD_CACHE.move_to_end(cache_key)
                # Evict oldest entries beyond the cache bound.
                while len(_BOS_UPLOAD_CACHE) > _BOS_UPLOAD_CACHE_MAX:
                    _BOS_UPLOAD_CACHE.popitem(last=False)
            return True
        except (ClientError, BotoCoreError, Exception) as exc:
            logger.warning("上传到 BOS 失败(%s,%s): %s", object_key, mode_label, exc)
            return False

    return _do_upload("同步")
def delete_file_from_bos(file_path: str | None = None,
                         object_name: str | None = None) -> bool:
    """
    Delete the given object from BOS; failures are logged, never raised.

    :param file_path: local file path (optional, used to derive the object name)
    :param object_name: BOS object name (optional, takes precedence)
    :return: whether the object was deleted
    """
    if not BOS_UPLOAD_ENABLED:
        return False
    client = _get_bos_client()
    if client is None:
        return False
    key_candidate = object_name.strip("/ ") if object_name else ""
    if not key_candidate and file_path:
        base_name = os.path.basename(
            os.path.abspath(os.path.expanduser(file_path)))
        key_candidate = base_name.strip()
    if not key_candidate:
        return False
    # Prefix with the configured image directory, mirroring upload_file_to_bos.
    if BOS_IMAGE_DIR:
        object_key = "/".join(
            part.strip("/ ") for part in (BOS_IMAGE_DIR, key_candidate) if part
        )
    else:
        object_key = key_candidate
    try:
        client.delete_object(Bucket=BOS_BUCKET_NAME, Key=object_key)
        logger.info(f"已从 BOS 删除文件: {object_key}")
        return True
    except Exception as e:
        # Fix: the original `except (ClientError, BotoCoreError, Exception)`
        # tuple was redundant — Exception already subsumes the boto errors.
        logger.warning(f"删除 BOS 文件失败({object_key}): {e}")
        return False
def image_to_base64(image: np.ndarray) -> str:
    """Encode an OpenCV image as a WebP base64 data URI.

    :param image: image array; None or empty yields ""
    :return: "data:image/webp;base64,..." string, or "" when encoding fails
    """
    if image is None or image.size == 0:
        return ""
    # Fix: the encode success flag was previously discarded; a failed encode
    # would have produced a data URI wrapping an invalid buffer.
    ok, buffer = cv2.imencode(".webp", image, [cv2.IMWRITE_WEBP_QUALITY, 90])
    if not ok:
        return ""
    img_base64 = base64.b64encode(buffer).decode("utf-8")
    return f"data:image/webp;base64,{img_base64}"
| def save_base64_to_unique_file( | |
| base64_string: str, output_dir: str = "output_images" | |
| ) -> str | None: | |
| """ | |
| 将带有MIME类型前缀的Base64字符串解码并保存到本地。 | |
| 文件名格式为: {md5_hash}_{timestamp}.{extension} | |
| """ | |
| os.makedirs(output_dir, exist_ok=True) | |
| try: | |
| match = re.match(r"data:(image/\w+);base64,(.+)", base64_string) | |
| if match: | |
| mime_type = match.group(1) | |
| base64_data = match.group(2) | |
| else: | |
| mime_type = "image/jpeg" | |
| base64_data = base64_string | |
| extension_map = { | |
| "image/jpeg": "jpg", | |
| "image/png": "png", | |
| "image/gif": "gif", | |
| "image/webp": "webp", | |
| } | |
| file_extension = extension_map.get(mime_type, "webp") | |
| decoded_data = base64.b64decode(base64_data) | |
| except (ValueError, TypeError, base64.binascii.Error) as e: | |
| logger.error(f"Base64 decoding failed: {e}") | |
| return None | |
| md5_hash = hashlib.md5(base64_data.encode("utf-8")).hexdigest() | |
| filename = f"{md5_hash}.{file_extension}" | |
| file_path = os.path.join(output_dir, filename) | |
| try: | |
| with open(file_path, "wb") as f: | |
| f.write(decoded_data) | |
| return file_path | |
| except IOError as e: | |
| logger.error(f"File writing failed: {e}") | |
| return None | |
def human_readable_size(size_bytes):
    """Format a byte count as a human-friendly string (B/KB/MB/GB/TB)."""
    remaining = size_bytes
    for unit in ("B", "KB", "MB", "GB"):
        if remaining < 1024:
            return f"{remaining:.1f} {unit}"
        remaining /= 1024
    # Anything past GB is reported in terabytes.
    return f"{remaining:.1f} TB"
def delete_file(file_path: str):
    """Remove *file_path*, logging the outcome; never raises."""
    try:
        os.remove(file_path)
    except Exception as error:
        logger.error(f"Failed to delete file {file_path}: {error}")
    else:
        logger.info(f"Deleted file: {file_path}")
def move_file_to_archive(file_path: str):
    """Move *file_path* into IMAGES_DIR, creating the archive dir if needed.

    Errors are logged, never raised. A file with the same basename already in
    the archive is overwritten by shutil.move's rename semantics.
    """
    try:
        # exist_ok avoids the check-then-create race of the previous
        # `if not os.path.exists(...)` guard.
        os.makedirs(IMAGES_DIR, exist_ok=True)
        filename = os.path.basename(file_path)
        destination = os.path.join(IMAGES_DIR, filename)
        shutil.move(file_path, destination)
        logger.info(f"Moved file to archive: {destination}")
    except Exception as error:
        logger.error(f"Failed to move file {file_path} to archive: {error}")
def save_image_high_quality(
    image: np.ndarray,
    output_path: str,
    quality: int = SAVE_QUALITY,
    *,
    upload_to_bos: bool = True,
) -> bool:
    """
    Persist *image* as WebP at the requested quality.

    :param image: image array
    :param output_path: destination path
    :param quality: WebP quality (0-100)
    :param upload_to_bos: when True, mirror the file to BOS after writing
    :return: whether the image was saved
    """
    try:
        ok, payload = cv2.imencode(
            ".webp", image, [cv2.IMWRITE_WEBP_QUALITY, quality]
        )
        if not ok:
            logger.error(f"Image encoding failed: {output_path}")
            return False
        with open(output_path, "wb") as fh:
            fh.write(payload)
        logger.info(f"High quality image saved successfully: {output_path}, quality: {quality}, size: {len(payload) / 1024:.2f} KB")
        if upload_to_bos:
            upload_file_to_bos(output_path)
        return True
    except Exception as e:
        logger.error(f"Failed to save image: {output_path}, error: {e}")
        return False
def convert_numpy_types(obj):
    """Recursively convert numpy values inside *obj* to native Python types.

    Generalized from the original float32/float64/int32/int64-only checks:
    any numpy floating/integer/bool scalar is converted, numpy arrays become
    nested Python lists, and tuple elements are converted (tuples stay
    tuples). Dicts and lists are handled as before; unknown types pass
    through unchanged.
    """
    if isinstance(obj, np.floating):
        return float(obj)
    if isinstance(obj, np.integer):
        return int(obj)
    if isinstance(obj, np.bool_):
        return bool(obj)
    if isinstance(obj, np.ndarray):
        # tolist() already yields native Python scalars recursively.
        return obj.tolist()
    if isinstance(obj, dict):
        return {k: convert_numpy_types(v) for k, v in obj.items()}
    if isinstance(obj, list):
        return [convert_numpy_types(i) for i in obj]
    if isinstance(obj, tuple):
        return tuple(convert_numpy_types(i) for i in obj)
    return obj
def compress_image_by_quality(image: np.ndarray, quality: int, output_format: str = 'webp') -> tuple[bytes, dict]:
    """
    Compress an image at the requested quality.

    :param image: input image
    :param quality: compression quality (10-100)
    :param output_format: output format ('jpg', 'png', 'webp')
    :return: (compressed image bytes, compression info dict)
    """
    try:
        height, width = image.shape[:2]
        fmt = output_format.lower()
        if fmt == 'png':
            # PNG uses a 0-9 compression level; map the quality value onto it.
            level = max(0, min(9, int((100 - quality) / 10)))
            ok, encoded = cv2.imencode(
                ".png", image, [cv2.IMWRITE_PNG_COMPRESSION, level]
            )
        elif fmt == 'webp':
            ok, encoded = cv2.imencode(
                ".webp", image, [cv2.IMWRITE_WEBP_QUALITY, quality]
            )
        else:
            ok, encoded = cv2.imencode(
                ".jpg", image, [cv2.IMWRITE_JPEG_QUALITY, quality]
            )
        if not ok:
            raise Exception("图像编码失败")
        payload = encoded.tobytes()
        return payload, {
            'original_dimensions': f"{width} × {height}",
            'compressed_dimensions': f"{width} × {height}",
            'quality': quality,
            'format': output_format.upper(),
            'size': len(payload),
        }
    except Exception as e:
        logger.error(f"Failed to compress image by quality: {e}")
        raise
def compress_image_by_dimensions(image: np.ndarray, target_width: int, target_height: int,
                                 quality: int = 100, output_format: str = 'jpg') -> tuple[bytes, dict]:
    """
    Resize an image to exact dimensions, then encode it.

    :param image: input image
    :param target_width: target width in pixels
    :param target_height: target height in pixels
    :param quality: compression quality
    :param output_format: output format ('jpg', 'png', 'webp')
    :return: (compressed image bytes, compression info dict)
    """
    try:
        source_height, source_width = image.shape[:2]
        # INTER_AREA gives the best quality for downscaling.
        resized = cv2.resize(
            image, (target_width, target_height),
            interpolation=cv2.INTER_AREA
        )
        fmt = output_format.lower()
        if fmt == 'png':
            level = max(0, min(9, int((100 - quality) / 10)))
            ok, encoded = cv2.imencode(
                ".png", resized, [cv2.IMWRITE_PNG_COMPRESSION, level]
            )
        elif fmt == 'webp':
            ok, encoded = cv2.imencode(
                ".webp", resized, [cv2.IMWRITE_WEBP_QUALITY, quality]
            )
        else:
            ok, encoded = cv2.imencode(
                ".jpg", resized, [cv2.IMWRITE_JPEG_QUALITY, quality]
            )
        if not ok:
            raise Exception("图像编码失败")
        payload = encoded.tobytes()
        return payload, {
            'original_dimensions': f"{source_width} × {source_height}",
            'compressed_dimensions': f"{target_width} × {target_height}",
            'quality': quality,
            'format': output_format.upper(),
            'size': len(payload),
        }
    except Exception as e:
        logger.error(f"Failed to compress image by dimensions: {e}")
        raise
def compress_image_by_file_size(image: np.ndarray, target_size_kb: float,
                                output_format: str = 'jpg') -> tuple[bytes, dict]:
    """
    Compress an image toward a target file size with a multi-stage search:
    for each candidate downscale factor, binary-search the quality setting.

    :param image: input image
    :param target_size_kb: target file size in KB
    :param output_format: output format ('jpg', 'png', 'webp')
    :return: (compressed image bytes, compression info dict)
    :raises Exception: when no encode at any scale/quality succeeds
    """
    try:
        original_height, original_width = image.shape[:2]
        target_size_bytes = int(target_size_kb * 1024)

        def encode_image(img, quality):
            """Encode *img* in the requested format; return bytes, or None on failure."""
            if output_format.lower() == 'png':
                # Map quality onto PNG's 0-9 compression level.
                compression_level = max(0, min(9, int((100 - quality) / 10)))
                success, encoded_img = cv2.imencode(
                    ".png", img, [cv2.IMWRITE_PNG_COMPRESSION, compression_level]
                )
            elif output_format.lower() == 'webp':
                success, encoded_img = cv2.imencode(
                    ".webp", img, [cv2.IMWRITE_WEBP_QUALITY, quality]
                )
            else:
                success, encoded_img = cv2.imencode(
                    ".jpg", img, [cv2.IMWRITE_JPEG_QUALITY, quality]
                )
            if success:
                return encoded_img.tobytes()
            return None

        def find_best_scale_and_quality(target_bytes):
            """Probe (scale, quality) combinations; return the best candidate dict or None."""
            best_result = None
            best_diff = float('inf')
            # Candidate downscale factors, from full size down to 30%.
            test_scales = [1.0, 0.95, 0.9, 0.85, 0.8, 0.75, 0.7, 0.65, 0.6, 0.55, 0.5, 0.45, 0.4, 0.35, 0.3]
            for scale in test_scales:
                # Resize for this scale; skip results that would drop below 50px.
                if scale < 1.0:
                    new_width = int(original_width * scale)
                    new_height = int(original_height * scale)
                    if new_width < 50 or new_height < 50:
                        continue
                    working_image = cv2.resize(image, (new_width, new_height), interpolation=cv2.INTER_AREA)
                else:
                    working_image = image
                    new_width, new_height = original_width, original_height
                # Binary-search the quality setting at this scale.
                min_q, max_q = 10, 100
                scale_best_result = None
                scale_best_diff = float('inf')
                for _ in range(20):  # at most 20 quality probes per scale
                    current_quality = (min_q + max_q) // 2
                    compressed_bytes = encode_image(working_image, current_quality)
                    if not compressed_bytes:
                        break
                    current_size = len(compressed_bytes)
                    size_diff = abs(current_size - target_bytes)
                    size_ratio = current_size / target_bytes
                    # Within 1% of target: accept immediately.
                    if 0.99 <= size_ratio <= 1.01:
                        return {
                            'bytes': compressed_bytes,
                            'scale': scale,
                            'width': new_width,
                            'height': new_height,
                            'quality': current_quality,
                            'size': current_size,
                            'ratio': size_ratio
                        }
                    # Track the closest result seen at this scale.
                    if size_diff < scale_best_diff:
                        scale_best_diff = size_diff
                        scale_best_result = {
                            'bytes': compressed_bytes,
                            'scale': scale,
                            'width': new_width,
                            'height': new_height,
                            'quality': current_quality,
                            'size': current_size,
                            'ratio': size_ratio
                        }
                    # Narrow the quality window toward the target size.
                    if current_size > target_bytes:
                        max_q = current_quality - 1
                    else:
                        min_q = current_quality + 1
                    if min_q >= max_q:
                        break
                # Promote this scale's best candidate into the global best.
                if scale_best_result and scale_best_diff < best_diff:
                    best_diff = scale_best_diff
                    best_result = scale_best_result
                # Within 5% already: stop trying smaller scales.
                if best_result and 0.95 <= best_result['ratio'] <= 1.05:
                    break
            return best_result

        logger.info(f"Starting multi-stage compression, target size: {target_size_bytes} bytes ({target_size_kb}KB)")
        # Run the search for the best (scale, quality) combination.
        result = find_best_scale_and_quality(target_size_bytes)
        if result:
            error_percent = abs(result['ratio'] - 1) * 100
            logger.info(f"Compression completed: scale ratio {result['scale']:.2f}, quality {result['quality']}%, "
                        f"size {result['size']} bytes, error {error_percent:.2f}%")
            # Always return the closest result regardless of error; just warn.
            if error_percent > 10:
                if result['ratio'] < 0.5:  # over-compressed far below target
                    suggested_size = result['size'] / 1024
                    logger.warning(f"Target size {target_size_kb}KB is too small, actually compressed to {suggested_size:.1f}KB, error {error_percent:.1f}%")
                elif result['ratio'] > 2.0:  # could not shrink to target
                    suggested_size = result['size'] / 1024
                    logger.warning(f"Target size {target_size_kb}KB is too large, minimum can be compressed to {suggested_size:.1f}KB, error {error_percent:.1f}%")
                else:
                    logger.warning(f"Cannot achieve target accuracy, error {error_percent:.1f}%, returning closest result")
            info = {
                'original_dimensions': f"{original_width} × {original_height}",
                'compressed_dimensions': f"{result['width']} × {result['height']}",
                'quality': result['quality'],
                'format': output_format.upper(),
                'size': result['size']
            }
            return result['bytes'], info
        else:
            raise Exception(f"无法将图片压缩到目标大小 {target_size_kb}KB")
    except Exception as e:
        logger.error(f"Failed to compress image by file size: {e}")
        raise
def convert_image_format(image: np.ndarray, target_format: str, quality: int = 100) -> tuple[bytes, dict]:
    """
    Re-encode an image into another format.

    :param image: input image
    :param target_format: target format ('jpg', 'png', 'webp')
    :param quality: quality parameter (ignored for PNG, which uses a fixed level)
    :return: (converted image bytes, format info dict)
    """
    try:
        height, width = image.shape[:2]
        fmt = target_format.lower()
        if fmt == 'png':
            # PNG: fixed default compression level.
            ok, encoded = cv2.imencode(
                ".png", image, [cv2.IMWRITE_PNG_COMPRESSION, 6]
            )
        elif fmt == 'webp':
            ok, encoded = cv2.imencode(
                ".webp", image, [cv2.IMWRITE_WEBP_QUALITY, quality]
            )
        else:
            ok, encoded = cv2.imencode(
                ".jpg", image, [cv2.IMWRITE_JPEG_QUALITY, quality]
            )
        if not ok:
            raise Exception("图像格式转换失败")
        payload = encoded.tobytes()
        return payload, {
            'original_dimensions': f"{width} × {height}",
            'compressed_dimensions': f"{width} × {height}",
            # PNG is lossless, so report quality as 100 for it.
            'quality': quality if fmt != 'png' else 100,
            'format': target_format.upper(),
            'size': len(payload),
        }
    except Exception as e:
        logger.error(f"Image format conversion failed: {e}")
        raise
def save_image_with_transparency(image: np.ndarray, file_path: str) -> bool:
    """
    Save an image with an alpha channel as PNG (via PIL).

    :param image: OpenCV image array (BGRA preferred; BGR gets an opaque alpha)
    :param file_path: destination path
    :return: whether the image was saved
    """
    if image is None:
        logger.error("Image is empty, cannot save")
        return False
    try:
        # Fix: os.makedirs("") raises FileNotFoundError when file_path has no
        # directory component; only create the parent when one exists.
        parent_dir = os.path.dirname(file_path)
        if parent_dir:
            os.makedirs(parent_dir, exist_ok=True)
        if len(image.shape) == 3 and image.shape[2] == 4:
            # BGRA -> RGBA for PIL.
            rgba_image = cv2.cvtColor(image, cv2.COLOR_BGRA2RGBA)
        elif len(image.shape) == 3 and image.shape[2] == 3:
            # BGR input: convert to RGB and attach a fully opaque alpha channel.
            rgb_image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
            rgba_image = np.dstack((rgb_image, np.full(rgb_image.shape[:2], 255, dtype=np.uint8)))
        else:
            logger.error("Image format does not support transparency saving")
            return False
        pil_image = Image.fromarray(rgba_image, 'RGBA')
        pil_image.save(file_path, 'PNG', optimize=True)
        file_size = os.path.getsize(file_path)
        logger.info(f"Transparent PNG image saved: {file_path}, size: {file_size/1024:.1f}KB")
        upload_file_to_bos(file_path)
        return True
    except Exception as e:
        logger.error(f"Failed to save transparent PNG image: {e}")
        return False