# api_light_hf / migrate_apis.py
# Deployed by Renecto (2026-03-12 12:47:03), commit cf7f643
"""
Migration script: transforms api_light_dev/apis/*.py files
to work with the new HF-based LLMClient.
Injects _ask_raw_hf helper, removes OpenAI imports, updates model defaults.
"""
import os
import re
# Source tree with the original OpenAI-based API modules.
# NOTE(review): SRC_DIR is never referenced in this file — main() reads and
# rewrites DST_DIR in place. Confirm whether a copy step was dropped.
SRC_DIR = r"C:\Users\caris\cursor\DD\api_light_dev\apis"
# Destination tree whose *.py files are transformed in place by main().
DST_DIR = r"C:\Users\caris\cursor\DD\api_light_hf\apis"
# Source text of a compatibility helper that transform_file() splices into
# each migrated module right after its import block.  The string must be
# valid top-level Python on its own: it starts with a newline (so it can be
# concatenated directly after the last import line) and ends with a newline.
HF_HELPER = '''
def _ask_raw_hf(messages, model, response_format=None):
    """Compatibility wrapper: routes OpenAI-style messages through HF LLMClient."""
    from src.clients.llm_client import LLMClient
    import json as _json
    client = LLMClient()
    system_prompt = None
    user_text = ""
    images = []
    # Flatten an OpenAI chat `messages` list into (system_prompt, user_text, images).
    # Only "system" and "user" roles are consumed; other roles are ignored.
    for msg in messages:
        role = msg.get("role", "")
        c = msg.get("content", "")
        if role == "system":
            if isinstance(c, str):
                system_prompt = c
        elif role == "user":
            if isinstance(c, str):
                # NOTE: a later plain-string user message replaces an earlier one.
                user_text = c
            elif isinstance(c, list):
                for part in c:
                    if isinstance(part, dict):
                        if part.get("type") == "text":
                            user_text += part.get("text", "")
                        elif part.get("type") == "image_url":
                            url = part.get("image_url", {}).get("url", "")
                            if url.startswith("data:"):
                                # data: URL -- keep only the base64 payload after the comma
                                images.append(url.split(",", 1)[1] if "," in url else url)
                            else:
                                images.append(url)
    if response_format is not None and hasattr(response_format, "model_json_schema"):
        # Pydantic schema supplied: use the structured-output path and return JSON text.
        result = client.call(
            prompt=user_text,
            schema=response_format,
            model=model,
            system_prompt=system_prompt,
            images=images if images else None,
            temperature=0,
        )
        return _json.dumps(result.model_dump(), ensure_ascii=False)
    else:
        # No schema: return the raw text completion.
        return client.call_raw(
            prompt=user_text,
            model=model,
            system_prompt=system_prompt,
            images=images if images else None,
        )
'''
# Literal (old, new) substitutions applied top-to-bottom to every migrated
# file, mapping OpenAI / Gemini model identifiers to Hugging Face models.
# NOTE(review): the bare quoted-name entries below already rewrite the model
# string wherever it appears, so the later `model="..."` and
# `selected_model ...` entries can never match post-replacement text — they
# are dead but harmless. Verify before pruning.
MODEL_REPLACEMENTS = [
    ('"gpt-4o-2024-08-06"', '"meta-llama/Llama-3.3-70B-Instruct"'),
    ('"gpt-4o-2024-11-20"', '"meta-llama/Llama-3.3-70B-Instruct"'),
    ('"gpt-4o"', '"meta-llama/Llama-3.3-70B-Instruct"'),
    ('"gpt-4o-mini"', '"meta-llama/Llama-3.1-8B-Instruct"'),
    ('"gemini-2.5-pro"', '"Qwen/Qwen2.5-VL-72B-Instruct"'),
    # Image-generation models map to FLUX; vision-capable chat maps to Qwen-VL.
    ('"gemini-2.5-flash-image"', '"black-forest-labs/FLUX.1-dev"'),
    ('"gemini-3-pro-image-preview"', '"black-forest-labs/FLUX.1-dev"'),
    ('"gemini-3-flash-preview"', '"Qwen/Qwen2.5-VL-72B-Instruct"'),
    ('"gemini-1.5-flash-preview-0514"', '"meta-llama/Llama-3.2-11B-Vision-Instruct"'),
    # Fine-tuned OpenAI model falls back to the base 8B instruct model.
    ('"ft:gpt-4o-mini-2024-07-18:dlpo-inc:ecinfo-extractor:Cg036C3l"', '"meta-llama/Llama-3.1-8B-Instruct"'),
    ('model="gpt-4o"', 'model="meta-llama/Llama-3.3-70B-Instruct"'),
    ('model="gpt-4o-mini"', 'model="meta-llama/Llama-3.1-8B-Instruct"'),
    ('model="gpt-4o-2024-08-06"', 'model="meta-llama/Llama-3.3-70B-Instruct"'),
    ('model="gemini-3-flash-preview"', 'model="Qwen/Qwen2.5-VL-72B-Instruct"'),
    ('selected_model = model if model else "gpt-4o"', 'selected_model = model if model else "meta-llama/Llama-3.3-70B-Instruct"'),
]
def find_last_import_line(lines):
    """Return the index of the last top-level import line in *lines*, or -1.

    Only lines that literally begin with ``import `` or ``from `` at column 0
    count; indented (function-scope) imports are deliberately skipped.
    """
    result = -1
    for idx, text in enumerate(lines):
        if text.startswith(("import ", "from ")):
            result = idx
    return result
def transform_file(content):
    """Apply all migration rewrites to one API module's source text.

    Steps: strip Gradio imports and ``gr.Request`` parameters, substitute
    model identifiers, and (when the module uses the OpenAI client) swap the
    OpenAI plumbing for the HF ``LLMClient`` plus the injected ``_ask_raw_hf``
    helper.

    Returns:
        (new_content, changed): the transformed text and whether it differs
        from *content*.
    """
    # --- 1. Remove Gradio imports/request params ---
    new = re.sub(r'import gradio as gr\r?\n', '', content)
    new = re.sub(r'from src\.utils\.tracer import \*', 'from src.utils.tracer import customtracer', new)
    new = re.sub(r',?\s*request:\s*gr\.Request', '', new)
    new = re.sub(r'request:\s*gr\.Request,?\s*', '', new)
    # --- 2. Model replacements (plain string, applied top to bottom) ---
    for old, rep in MODEL_REPLACEMENTS:
        new = new.replace(old, rep)
    # --- 3. OpenAI -> LLMClient ---
    if "from openai import OpenAI" in new or "OpenAI()" in new:
        # Remove openai imports.
        new = re.sub(r'import openai\r?\n', '', new)
        new = re.sub(r'from openai import OpenAI\r?\n', '', new)
        # Add LLMClient import if not present (anchored after `import os`).
        if "from src.clients" not in new:
            new = re.sub(r'(import os\r?\n)', r'\1from src.clients.llm_client import LLMClient\n', new)
        # Inject helper after the last top-level import (only once).
        if "_ask_raw_hf" not in new:
            lines = new.split("\n")
            idx = find_last_import_line(lines)
            if idx >= 0:
                before = "\n".join(lines[:idx + 1])
                after = "\n".join(lines[idx + 1:])
                # HF_HELPER starts/ends with "\n", so plain concatenation is safe.
                new = before + HF_HELPER + after
            else:
                new = HF_HELPER + new
        # Rewrite the simple ask_raw(messages, m) pattern that ends by
        # returning response.choices[0].message.content.
        new = re.sub(
            r'def ask_raw\(messages,\s*m\s*\):\s*\n'
            r'(?:\s+[^\n]+\n)*?'
            r'\s+return response\.choices\[0\]\.message\.content',
            'def ask_raw(messages, m):\n return _ask_raw_hf(messages, m)',
            new,
            flags=re.MULTILINE,
        )
        # Replace any remaining client = OpenAI(...) construction.
        new = re.sub(r'client = OpenAI\([^)]*\)', 'client = LLMClient()', new)
        # Rewrite the head of client.beta.chat.completions.parse(...) calls.
        # NOTE(review): only the call head is replaced — the original call's
        # remaining keyword arguments (model=..., messages=...,
        # response_format=...) are left in place, which likely yields invalid
        # calls. Confirm against the target files (nayose_fv,
        # ecinfo2winningrate, etc.).
        new = re.sub(
            r'response = client\.beta\.chat\.completions\.parse\(',
            'response = _ask_raw_hf([{"role":"user","content":p}], model,',
            new
        )
        # Clean up leftover response.choices[0] accessors.
        new = re.sub(
            r'response\.choices\[0\]\.message\.(?:content|parsed)',
            'response',
            new
        )
    return new, new != content
def main():
    """Transform every eligible *.py module under DST_DIR in place.

    Skips dunder files (``__init__.py`` etc.); prints a summary of how many
    files were actually rewritten.
    """
    candidates = sorted(
        name
        for name in os.listdir(DST_DIR)
        if name.endswith(".py") and not name.startswith("__")
    )
    touched = 0
    for name in candidates:
        full_path = os.path.join(DST_DIR, name)
        # errors="replace" tolerates stray non-UTF-8 bytes in the source files.
        with open(full_path, "r", encoding="utf-8", errors="replace") as fh:
            original = fh.read()
        migrated, was_changed = transform_file(original)
        if was_changed:
            with open(full_path, "w", encoding="utf-8") as fh:
                fh.write(migrated)
            touched += 1
    print(f"Updated {touched}/{len(candidates)} files")


if __name__ == "__main__":
    main()