Spaces:

Mfischthal
/

DialogueExtractor

Sleeping

DialogueExtractor / teacher.py

Upload 6 files

758613a verified 2 months ago

1.59 kB

	import os, time
	from typing import Optional
	from openai import OpenAI

	INSTRUCTION = """You are a dialogue structuring assistant for multi-speaker TTS.

	Map characters to speakers dynamically within each passage (first distinct speaker you detect -> Speaker 1, second -> Speaker 2, etc.).

	Requirements:
	- Detect speaker changes from context (“said/replied/asked/…”).
	- Output lines strictly as:
	Speaker 1: …
	Speaker 2: …
	(and so on)
	- Label narration (non-dialogue) as Speaker 1.
	- Remove dialogue attribution tags (e.g., “he said”), EXCEPT when the narrator speaks in first person; keep those inline (e.g., “I said”).
	- Preserve original order and content; no omissions or rewrites.
	- Return only the formatted lines, no extra commentary.
	"""

	MODEL = os.getenv("OPENAI_MODEL", "gpt-4o-mini")
	client = OpenAI() # uses OPENAI_API_KEY

	STRICT_SUFFIX = "\n\nIMPORTANT: Every line must start with 'Speaker N: ' and include at least two lines."

	def call_teacher(passage: str, temperature: float = 0.0, max_retries: int = 2) -> Optional[str]:
	model = os.getenv("OPENAI_MODEL", MODEL)
	prompt = f"{INSTRUCTION}\n\nText:\n{passage}"
	for i in range(max_retries + 1):
	try:
	resp = client.responses.create(
	model=model,
	input=prompt,
	temperature=temperature,
	)
	out = resp.output_text
	if out and out.strip():
	return out
	except Exception:
	time.sleep(0.5 * (i + 1))
	prompt = prompt + STRICT_SUFFIX
	return None