# NOTE: the three lines below were Hugging Face web-page residue accidentally
# pasted into the file ("basilboy's picture / Update app.py / b862b43 verified");
# kept here as a comment so the module parses as valid Python.
# app.py
import os, re, math, random, json
import torch
import torch.nn as nn
import torch.nn.functional as F
import gradio as gr
from transformers import AutoTokenizer
from safetensors.torch import load_file as load_sft
from huggingface_hub import snapshot_download
# Keep all computation in float32 (checkpoints are force-cast on load too).
torch.set_default_dtype(torch.float32)
# ===============================================
# Default config (from your training notes)
# ===============================================
# Fallback hyper-parameters; entries are overridden by values read from, or
# inferred out of, a loaded checkpoint (see _read_config_from_dict_or_infer).
DEFAULT_CONF = {
    "embed_dim": 1024,        # model width E
    "num_heads": 8,           # attention heads (E must be divisible by this)
    "expansion_factor": 4,    # MLP hidden size = E * expansion_factor
    "num_blocks": 8,          # number of AttnBlock layers
    "radius": 16,             # local-attention band half-width, in tokens
    "tokenizer_name": "gpt2",
}
# ===============================================
# Minimal CNA (inference-ready)
# ===============================================
class AttnBlock(nn.Module):
    """One pre-norm transformer block with banded (local) self-attention.

    Attention is restricted to a symmetric band (NOT causal): token i attends
    to token j iff |i - j| <= radius. Interleaved RoPE is applied to Q and K.
    Residual branches (Wo and the last MLP layer) are zero-initialised to
    match training, so a fresh block is initially the identity.
    """

    def __init__(self, embed_dim, num_heads, expansion_factor):
        super().__init__()
        assert embed_dim % num_heads == 0, "embed_dim must be divisible by num_heads"
        self.embed_dim = embed_dim
        self.num_heads = num_heads
        self.head_dim = embed_dim // num_heads
        self.norm1 = nn.LayerNorm(embed_dim)
        self.QKV = nn.Linear(embed_dim, embed_dim * 3)  # fused Q/K/V projection
        self.Wo = nn.Linear(embed_dim, embed_dim)
        self.norm2 = nn.LayerNorm(embed_dim)
        self.mlp = nn.Sequential(
            nn.Linear(embed_dim, embed_dim * expansion_factor),
            nn.GELU(),
            nn.Linear(embed_dim * expansion_factor, embed_dim),
        )
        # zero-init residual branches (match training)
        nn.init.zeros_(self.Wo.weight); nn.init.zeros_(self.Wo.bias)
        nn.init.zeros_(self.mlp[-1].weight); nn.init.zeros_(self.mlp[-1].bias)

    def rope(self, Qh, Kh_seq, cos, sin):
        """Apply interleaved rotary position embeddings to Q and K.

        Even/odd feature pairs (0::2 / 1::2) are rotated by per-position angle
        tables ``cos``/``sin``; the tables arrive with angles duplicated into
        adjacent slots, so ``cos[..., 0::2]`` recovers the raw angle table
        (see CNA._rope_seq). Returns the rotated (Q, K) pair.
        """
        Qe = Qh[..., 0::2]; Qo = Qh[..., 1::2]
        ce = cos[..., 0::2]; se = sin[..., 0::2]
        Qr_e = Qe * ce - Qo * se
        Qr_o = Qe * se + Qo * ce
        Qh2 = torch.empty_like(Qh); Qh2[..., 0::2] = Qr_e; Qh2[..., 1::2] = Qr_o
        Ke = Kh_seq[..., 0::2]; Ko = Kh_seq[..., 1::2]
        Kr_e = Ke * ce - Ko * se
        Kr_o = Ke * se + Ko * ce
        Kh2 = torch.empty_like(Kh_seq); Kh2[..., 0::2] = Kr_e; Kh2[..., 1::2] = Kr_o
        return Qh2, Kh2

    def forward(self, x, rope, radius):
        """Run the block on activations x of shape [B, S, E].

        Args:
            x: input activations [B, S, E].
            rope: (cos, sin) tables from CNA._rope_seq, each [1, S, 1, head_dim].
            radius: band half-width; positions further apart are masked out.
        """
        # keep LN inputs & params same dtype
        if x.dtype != self.norm1.weight.dtype:
            x = x.to(self.norm1.weight.dtype)
        h = self.norm1(x)
        B, S, E = h.shape
        cos, sin = rope
        nh, hd = self.num_heads, self.head_dim
        cos = cos.to(h.dtype).to(h.device).permute(0,2,1,3)  # [1,1,S,hd]
        sin = sin.to(h.dtype).to(h.device).permute(0,2,1,3)
        # local band mask: 0 inside the band, dtype-min (effectively -inf) outside
        idx = torch.arange(S, device=h.device)
        idx_dist = (idx.view(1, S) - idx.view(S, 1)).abs()
        neg_inf = torch.finfo(h.dtype).min
        mask = torch.full((S, S), neg_inf, dtype=h.dtype, device=h.device)
        mask[idx_dist <= int(radius)] = 0
        mask = mask.view(1, 1, S, S)
        qkv = self.QKV(h)
        q, k, v = qkv.chunk(3, dim=-1)
        # reshape to [B, heads, S, head_dim]
        Qh = q.view(B,S,nh,hd).permute(0,2,1,3).contiguous()
        Kh_seq = k.view(B,S,nh,hd).permute(0,2,1,3).contiguous()
        Vh = v.view(B,S,nh,hd).permute(0,2,1,3).contiguous()
        assert hd % 2 == 0, "rope needs even head_dim"
        Qh, Kh_seq = self.rope(Qh, Kh_seq, cos, sin)
        Kh = Kh_seq.permute(0,1,3,2).contiguous()  # transpose K for Q @ K^T
        logits = (Qh @ Kh) * (hd ** -0.5)  # scaled dot-product scores
        attn = F.softmax(logits + mask, dim=-1) @ Vh
        attn = attn.permute(0,2,1,3).contiguous().view(B,S,E)
        x = x + self.Wo(attn)            # residual attention branch
        x = x + self.mlp(self.norm2(x))  # residual MLP branch
        return x
class CNA(nn.Module):
    """Denoising model: token embedding -> num_blocks banded-attention blocks -> vocab logits.

    There is no learned positional embedding table; position enters only
    through the RoPE tables built per forward pass in _rope_seq.
    """

    def __init__(self, embed_dim, num_heads, expansion_factor, num_blocks, radius, vocab_size):
        super().__init__()
        self.embed_dim = embed_dim
        self.num_heads = num_heads
        self.expansion_factor = expansion_factor
        self.num_blocks = num_blocks
        self.vocab_size = vocab_size
        self.radius = radius
        self.tok_emb = nn.Embedding(vocab_size, embed_dim)
        self.blocks = nn.ModuleList([AttnBlock(embed_dim, num_heads, expansion_factor) for _ in range(num_blocks)])
        self.proj = nn.Linear(embed_dim, vocab_size)

    def _rope_seq(self, S, hd, device, dtype, base=10000.0):
        """Build interleaved RoPE tables for a length-S sequence.

        Returns (cos, sin), each of shape [1, S, 1, hd], with each angle
        duplicated into adjacent even/odd feature slots so that
        ``table[..., 0::2]`` recovers the raw [S, hd//2] angle table
        (consumed that way in AttnBlock.rope).
        """
        pos = torch.arange(S, device=device, dtype=dtype)
        half = hd // 2
        idx = torch.arange(half, device=device, dtype=dtype)
        inv = base ** (-idx / half)       # inverse frequencies per feature pair
        ang = pos[:, None] * inv[None, :] # [S, hd//2] rotation angles
        cos = ang.cos().unsqueeze(0).unsqueeze(2)
        sin = ang.sin().unsqueeze(0).unsqueeze(2)
        # interleave each angle into (even, odd) slots -> [1, S, 1, hd]
        cos = torch.stack((cos, cos), dim=-1).reshape(1, S, 1, hd)
        sin = torch.stack((sin, sin), dim=-1).reshape(1, S, 1, hd)
        return cos, sin

    def forward(self, x):
        """Map int64 token ids [B, S] (or pre-embedded activations) to logits [B, S, vocab_size]."""
        if x.dtype == torch.long and x.dim() == 2:
            h = self.tok_emb(x)
        else:
            h = x  # assumes x is already [B, S, E] embeddings — TODO confirm callers
        # ensure embeddings/activations dtype follows model dtype
        target_dtype = next(self.parameters()).dtype
        if h.dtype != target_dtype:
            h = h.to(target_dtype)
        B, S, E = h.shape
        hd = self.embed_dim // self.num_heads
        cos, sin = self._rope_seq(S, hd, h.device, h.dtype)
        for blk in self.blocks:
            h = blk(h, rope=(cos, sin), radius=self.radius)
        return self.proj(h)
# ===============================================
# Helpers
# ===============================================
def to_batch2(ids_like) -> torch.Tensor:
    """Coerce token ids (flat list, nested list, or tensor) to int64 shape [1, S].

    Accepts [S], [1, S], [1, 1, S]; anything else is flattened into one row.
    """
    t = torch.tensor(ids_like, dtype=torch.long)
    if t.dim() == 2:
        return t
    if t.dim() == 1:
        return t.unsqueeze(0)       # [S] -> [1, S]
    if t.dim() == 3 and t.shape[0] == 1 and t.shape[1] == 1:
        return t.squeeze(1)         # [1, 1, S] -> [1, S]
    return t.view(1, -1)            # fallback: flatten to a single row
def infer_expansion_factor_from_state(state, embed_dim):
    """Infer the MLP expansion factor from the first block's MLP weights.

    Prefers the input projection (rows = E * factor), then the output
    projection (cols = E * factor); falls back to DEFAULT_CONF otherwise.
    """
    w_in = state.get("blocks.0.mlp.0.weight")
    if w_in is not None:
        return int(w_in.shape[0] // embed_dim)
    w_out = state.get("blocks.0.mlp.2.weight")
    if w_out is not None:
        return int(w_out.shape[1] // embed_dim)
    return DEFAULT_CONF["expansion_factor"]
@torch.no_grad()
def decode(ids, tokenizer, max_chars=1000):
    """Decode a 1-D id tensor to display text: newlines flattened to spaces,
    truncated to max_chars with a trailing ellipsis when clipped."""
    text = tokenizer.decode(ids.tolist(), skip_special_tokens=True)
    flat = text.replace("\n", " ")
    if len(flat) > max_chars:
        return flat[:max_chars] + "…"
    return flat
@torch.no_grad()
def model_logits(model, x):
    """Run a forward pass without building an autograd graph."""
    logits = model(x)
    return logits
def to_fixed_len_ids(text, tokenizer, seqlen, pad_mode="random", rnd=None):
    """Encode `text` and force it to exactly `seqlen` tokens, shape [1, seqlen].

    Overlong encodings are truncated; short ones are padded either with the
    tokenizer's EOS token (pad_mode == "eos", when available) or with random
    vocabulary ids drawn from `rnd`.
    """
    rnd = rnd or random.Random()
    ids = tokenizer.encode(text, add_special_tokens=False)[:seqlen]
    shortfall = seqlen - len(ids)
    if shortfall > 0:
        if pad_mode == "eos" and tokenizer.eos_token_id is not None:
            ids += [tokenizer.eos_token_id] * shortfall
        else:
            vocab = tokenizer.vocab_size
            ids += [rnd.randrange(vocab) for _ in range(shortfall)]
    return torch.tensor(ids, dtype=torch.long).unsqueeze(0)
def _parse_index_csv(indices_csv):
    """Parse a '0, 5, 10-20' style CSV into a set of token positions.

    Ranges may be written in either order ('20-10' works); malformed entries
    (e.g. 'abc', '3-') are skipped silently so a typo never crashes the UI.
    """
    idxs = set()
    if not indices_csv or not indices_csv.strip():
        return idxs
    for part in indices_csv.split(","):
        part = part.strip()
        if not part:
            continue
        try:
            if "-" in part:
                a, b = part.split("-", 1)
                a, b = int(a), int(b)
                idxs.update(range(min(a, b), max(a, b) + 1))
            else:
                idxs.add(int(part))
        except ValueError:
            # was a bare `except:` — narrow to the int() parse failure only
            pass
    return idxs


def apply_noise_ops(x, tokenizer, indices_csv, add_noise_left, add_noise_right, seqlen, seed=0):
    """Randomise tokens at the positions named in `indices_csv`, optionally
    prepend/append random tokens, then re-fit to exactly `seqlen` tokens.

    Args:
        x: int64 tensor [1, S] of token ids (not mutated; a clone is edited).
        tokenizer: provides vocab_size for random draws.
        indices_csv: positions like '0, 5, 10-20' (see _parse_index_csv).
        add_noise_left / add_noise_right: counts of random tokens to attach.
        seqlen: final length — longer results are truncated, shorter ones
            padded with random tokens.
        seed: seeds a private random.Random so results are reproducible.

    Returns:
        int64 tensor [1, seqlen].
    """
    rnd = random.Random(seed)
    V = tokenizer.vocab_size
    x = x.clone()
    # Replace each requested, in-range position with a random token.
    # Sorted iteration keeps RNG consumption order deterministic.
    for j in sorted(_parse_index_csv(indices_csv)):
        if 0 <= j < x.shape[1]:
            x[0, j] = rnd.randrange(V)
    if add_noise_left > 0:
        prefix = torch.tensor([rnd.randrange(V) for _ in range(int(add_noise_left))], dtype=torch.long).unsqueeze(0)
        x = torch.cat([prefix, x], dim=1)
    if add_noise_right > 0:
        suffix = torch.tensor([rnd.randrange(V) for _ in range(int(add_noise_right))], dtype=torch.long).unsqueeze(0)
        x = torch.cat([x, suffix], dim=1)
    # Re-fit to exactly seqlen: truncate, or pad the tail with random tokens.
    if x.shape[1] > seqlen:
        x = x[:, :seqlen]
    elif x.shape[1] < seqlen:
        need = seqlen - x.shape[1]
        pad = torch.tensor([rnd.randrange(V) for _ in range(need)], dtype=torch.long).unsqueeze(0)
        x = torch.cat([x, pad], dim=1)
    return x
@torch.no_grad()
def sample_from_logits(logits_row, temperature=1.0, current_token=None, exclude_current=True):
    """Sample a token id from a single row of logits.

    temperature <= 0 degenerates to argmax. When excluding the current token,
    its probability is zeroed and the rest renormalised; if nothing remains,
    fall back to argmax.
    """
    greedy = int(torch.argmax(logits_row).item())
    if temperature <= 0:
        return greedy
    probs = torch.softmax(logits_row / float(temperature), dim=-1)
    if exclude_current and current_token is not None:
        probs = probs.clone()
        probs[current_token] = 0.0
        total = probs.sum()
        if total.item() <= 0:
            return greedy
        probs = probs / total
    return int(torch.multinomial(probs, 1).item())
# ===============================================
# Weight loading (file / folder / HF Hub)
# ===============================================
# Fallback checkpoint locations used by load_model when the UI's source box
# does not resolve; overridable via environment variables.
DEFAULT_CKPT = os.environ.get("CKPT_PATH", "ckpt_latest.pt")
DEFAULT_WEIGHTS_DIR = os.environ.get("WEIGHTS_DIR", "weights_latest")
def _read_config_from_dict_or_infer(state, cfg):
    """Merge DEFAULT_CONF with checkpoint cfg, then override with values
    inferred from the state dict itself (embed dim, block count, expansion)."""
    merged = dict(DEFAULT_CONF)
    merged.update(cfg or {})
    emb = state.get("tok_emb.weight")
    if emb is not None:
        merged["embed_dim"] = emb.shape[1]
    block_ids = []
    for key in state:
        m = re.match(r"blocks\.(\d+)\.", key)
        if m:
            block_ids.append(int(m.group(1)))
    if block_ids:
        merged["num_blocks"] = max(block_ids) + 1
    if "blocks.0.mlp.0.weight" in state or "blocks.0.mlp.2.weight" in state:
        merged["expansion_factor"] = infer_expansion_factor_from_state(state, merged["embed_dim"])
    # guarantee a usable tokenizer name even if cfg carried None/empty
    merged["tokenizer_name"] = merged.get("tokenizer_name") or "gpt2"
    return merged
def _is_state_dict(obj):
if isinstance(obj, dict) and obj:
sample_val = next(iter(obj.values()))
return isinstance(sample_val, torch.Tensor)
return False
def _load_state_from_pt(path: str):
    """Load weights from a .pt/.bin file.

    Accepts either a raw state dict, or a payload dict carrying a 'model'
    state dict (plus optional 'config' / 'tokenizer_name' entries).
    Returns (state, cfg); raises ValueError on anything else.
    """
    payload = torch.load(path, map_location="cpu")
    if isinstance(payload, dict):
        model_sd = payload.get("model")
        if isinstance(model_sd, dict):
            cfg = dict(payload.get("config") or {})
            if "tokenizer_name" in payload:
                cfg["tokenizer_name"] = payload["tokenizer_name"]
            return model_sd, cfg
    if _is_state_dict(payload):
        return payload, {}
    raise ValueError(f"Unsupported .pt format at {path}: expected a state_dict or a payload with 'model'.")
def _merge_state_dicts(dicts):
merged = {}
for d in dicts:
for k, v in d.items():
merged[k] = v
return merged
def _load_state_from_folder(weights_dir: str):
    """Load weights (and optional config.json) from a local folder.

    Priority: a single 'model.safetensors', then any set of .safetensors
    shards (merged), then .pt/.bin files (raw state dicts or
    {'model': ..., 'config': ...} payloads). Returns (state, cfg).

    Raises:
        FileNotFoundError: folder missing, or no weight files inside it.
        ValueError: a .pt/.bin shard has an unrecognised format.
    """
    if not os.path.isdir(weights_dir):
        raise FileNotFoundError(f"Folder not found: {weights_dir}")
    cfg_path = os.path.join(weights_dir, "config.json")
    cfg = {}
    if os.path.exists(cfg_path):
        with open(cfg_path, "r") as f:
            cfg = json.load(f)
    files = sorted(os.listdir(weights_dir))
    sft_files = [f for f in files if f.endswith(".safetensors")]
    pt_files = [f for f in files if f.endswith(".pt") or f.endswith(".bin")]
    state = None
    if "model.safetensors" in sft_files:
        state = load_sft(os.path.join(weights_dir, "model.safetensors"))
    elif sft_files:
        # multiple shards: merge them (later files win on duplicate keys)
        parts = [load_sft(os.path.join(weights_dir, f)) for f in sft_files]
        state = _merge_state_dicts(parts)
    elif pt_files:
        parts = []
        for f in pt_files:
            part = torch.load(os.path.join(weights_dir, f), map_location="cpu")
            if isinstance(part, dict) and "model" in part and isinstance(part["model"], dict):
                parts.append(part["model"])
                # fold shard-level config / tokenizer hints into cfg
                if "config" in part and isinstance(part["config"], dict):
                    cfg = {**cfg, **part["config"]}
                if "tokenizer_name" in part:
                    cfg.setdefault("tokenizer_name", part["tokenizer_name"])
            elif _is_state_dict(part):
                parts.append(part)
            else:
                raise ValueError(f"Unsupported shard format: {f}")
        state = _merge_state_dicts(parts)
    else:
        raise FileNotFoundError(
            f"No weights found in {weights_dir}. Expected .safetensors or .pt files."
        )
    return state, cfg
def _load_state_from_hub(repo_id: str, subfolder: str | None = None, revision: str | None = None):
    """Snapshot a Hugging Face Hub repo locally, then load weights from it
    (or from `subfolder` within it) via _load_state_from_folder."""
    cache_dir = snapshot_download(repo_id=repo_id, revision=revision, allow_patterns=None)
    path = os.path.join(cache_dir, subfolder) if subfolder else cache_dir
    return _load_state_from_folder(path)
def load_model(source: str):
    """Resolve `source` into a ready CNA model.

    `source` may be a .pt/.bin file path, a local folder, a Hub repo id
    (anything containing '/'), or empty — in which case well-known local
    names and the env-configured defaults are tried in order.

    Returns:
        (model, tokenizer, radius) — model forced to float32 and eval mode.

    Raises:
        FileNotFoundError: no weights could be resolved from any source.
    """
    src = source or ""
    state, cfg = None, {}
    if os.path.isfile(src) and (src.endswith(".pt") or src.endswith(".bin")):
        state, cfg = _load_state_from_pt(src)
    elif os.path.isdir(src):
        state, cfg = _load_state_from_folder(src)
    elif "/" in src:  # Hub repo id
        subfolder = os.environ.get("WEIGHTS_SUBFOLDER") or None
        revision = os.environ.get("WEIGHTS_REVISION") or None
        state, cfg = _load_state_from_hub(src, subfolder=subfolder, revision=revision)
    else:
        # fallbacks: well-known local names, then env-configured defaults
        if os.path.isfile("weights_latest.pt"):
            state, cfg = _load_state_from_pt("weights_latest.pt")
        elif os.path.isfile(DEFAULT_CKPT):
            state, cfg = _load_state_from_pt(DEFAULT_CKPT)
        elif os.path.isdir(DEFAULT_WEIGHTS_DIR):
            state, cfg = _load_state_from_folder(DEFAULT_WEIGHTS_DIR)
        else:
            raise FileNotFoundError(
                f"Could not resolve weights from '{src}'. Tried file (.pt), folder, hub repo id, "
                f"then defaults ('{DEFAULT_CKPT}', '{DEFAULT_WEIGHTS_DIR}')."
            )
    conf = _read_config_from_dict_or_infer(state, cfg)
    # Tokenizer
    tokenizer = AutoTokenizer.from_pretrained(conf["tokenizer_name"], use_fast=True)
    if tokenizer.pad_token is None:
        tokenizer.pad_token = tokenizer.eos_token
    tokenizer.model_max_length = 1_000_000_000  # disable length truncation warnings
    vocab_size = tokenizer.vocab_size
    # Build model
    model = CNA(
        conf["embed_dim"], conf["num_heads"], conf["expansion_factor"],
        conf["num_blocks"], conf["radius"], vocab_size
    )
    # Load state, tolerating a projection (vocab) size mismatch.
    # NOTE: load_state_dict(strict=False) only tolerates missing/unexpected
    # KEYS — it still raises on SHAPE mismatches. So drop shape-mismatched
    # tensors first, then let strict=False report them as missing keys.
    model_sd = model.state_dict()
    filtered = {k: v for k, v in state.items()
                if k not in model_sd or model_sd[k].shape == v.shape}
    missing, unexpected = model.load_state_dict(filtered, strict=False)
    if any(k.startswith("proj.") for k in missing):
        # checkpoint's output projection absent or differently sized: re-init
        with torch.no_grad():
            nn.init.normal_(model.proj.weight, std=0.02)
            nn.init.zeros_(model.proj.bias)
    # enforce float32 across params & buffers
    model = model.to(torch.float32)
    with torch.no_grad():
        for p in model.parameters():
            if p.dtype.is_floating_point:
                p.data = p.data.float()
        for _, buf in model.named_buffers():
            if buf.dtype.is_floating_point:
                buf.data = buf.data.float()
    model.eval()
    return model, tokenizer, conf["radius"]
# Process-wide cache of the most recently loaded model/tokenizer, keyed by
# the weights source string stored in "ckpt" (see ensure_model).
model_cache = {"model": None, "tokenizer": None, "radius": None, "ckpt": None}
def _auto_default_source():
    """Pick a default weights source: WEIGHTS_SOURCE env var, then well-known
    local paths, then any checkpoint-looking file in the CWD, then a
    last-resort name (which load_model may still fail on)."""
    env = os.environ.get("WEIGHTS_SOURCE")
    if env:
        return env
    if os.path.isdir("weights_latest"):
        return "weights_latest"
    for candidate in ("weights_latest.pt", "ckpt_latest.pt"):
        if os.path.isfile(candidate):
            return candidate
    for entry in sorted(os.listdir(".")):
        if entry.endswith((".pt", ".safetensors")):
            return entry
    return "weights_latest.pt"
def ensure_model(source_path_or_repo):
    """(Re)load the model into `model_cache` iff the requested source changed
    (or nothing is loaded yet)."""
    src = source_path_or_repo or _auto_default_source()
    if model_cache["model"] is not None and model_cache["ckpt"] == src:
        return
    m, tok, rad = load_model(src)
    model_cache.update({"model": m, "tokenizer": tok, "radius": rad, "ckpt": src})
# ===============================================
# Strategy 1 (random position) with argmax / sample
# ===============================================
@torch.no_grad()
def step_strategy1(model, x, mode="argmax", temperature=1.0, exclude_current=True):
    """One denoising step: pick a uniformly random position and rewrite its
    token from the model's logits there (argmax or sampled).

    Mutates x in place and also returns it. Uses torch's RNG for the
    position so torch.manual_seed makes runs reproducible.
    """
    S = x.shape[1]
    pos = int(torch.randint(0, S, (1,)).item())
    logits_pos = model_logits(model, x)[0, pos]
    if mode != "sample":
        x[0, pos] = int(torch.argmax(logits_pos).item())
        return x
    cur_tok = int(x[0, pos].item())
    x[0, pos] = sample_from_logits(
        logits_pos,
        temperature=float(temperature),
        current_token=cur_tok,
        exclude_current=bool(exclude_current),
    )
    return x
# ===============================================
# Gradio callbacks
# ===============================================
def init_random(src, seqlen, seed):
    """Gradio callback: seed both RNGs and create a fresh random sequence.

    Returns (ids_as_nested_list, decoded_text, status_message).
    """
    ensure_model(src)
    random.seed(seed); torch.manual_seed(seed)
    tok = model_cache["tokenizer"]
    n = int(seqlen)
    x = torch.randint(0, tok.vocab_size, (1, n))
    return x.tolist(), decode(x[0], tok), f"Initialized random sequence (len={n})"
def to_ranges(indices):
    """Compress token indices (any order, duplicates OK) into 'a-b, c' CSV runs."""
    if not indices:
        return ""
    ordered = sorted(set(indices))
    runs = []
    run_start = run_end = ordered[0]
    for i in ordered[1:]:
        if i == run_end + 1:
            run_end = i
            continue
        runs.append((run_start, run_end))
        run_start = run_end = i
    runs.append((run_start, run_end))
    return ", ".join(f"{a}-{b}" if a != b else f"{a}" for a, b in runs)
def capture_selection(text, seqlen, current_ids, evt: gr.SelectData | None = None):
    """
    Map highlighted character span in `text` to token index ranges using tokenizer offsets.
    Auto-fills the indices box so you can 'Noise Selection'.

    Returns (indices_csv_or_noop_update, status_message). `current_ids` is
    accepted for wiring symmetry but not read here.
    """
    ensure_model(None)
    tok = model_cache["tokenizer"]
    if not text:
        return gr.update(), "No text to select from."
    # Try to read (start, end) from the event payload
    start, end = None, None
    if evt is not None:
        try:
            # gradio SelectData for Textbox exposes .index = (start_char, end_char)
            start, end = evt.index
        except Exception:
            # payload shape varies across gradio versions; treat as no selection
            pass
    # Fallback: nothing selected
    if start is None or end is None or start == end:
        return gr.update(), "No selection detected (drag to highlight)."
    # Bound the indices defensively
    start = max(0, min(len(text), int(start)))
    end = max(0, min(len(text), int(end)))
    # Get per-token char offsets from the fast tokenizer
    enc = tok(text, add_special_tokens=False, return_offsets_mapping=True)
    offsets = enc["offset_mapping"]  # list of (s,e) per token
    token_idxs = []
    for i, (s, e) in enumerate(offsets):
        if s is None or e is None:
            continue
        # overlap if token span intersects [start, end)
        if max(s, start) < min(e, end):
            token_idxs.append(i)
    if not token_idxs:
        return gr.update(), "Selection didn't hit any tokens (maybe whitespace)."
    # Clip to current sequence length (so we don't index beyond S)
    S = int(seqlen)
    token_idxs = [i for i in token_idxs if i < S]
    if not token_idxs:
        return gr.update(), "Selected span maps beyond current sequence length."
    indices_csv = to_ranges(token_idxs)
    return indices_csv, f"Selected chars [{start}:{end}) → tokens {indices_csv}"
def noise_selection(src, state_ids, seqlen, indices_csv, seed):
    """Gradio callback: noise only the selected token indices."""
    # Reuse apply_noise but force prepend/append noise to zero
    return apply_noise(src, state_ids, seqlen, indices_csv, 0, 0, seed)
def apply_noise(src, state_ids, seqlen, indices_csv, add_left, add_right, seed):
    """Gradio callback: apply index/edge noise to the current sequence, or to
    a fresh random one when no sequence exists yet.

    Returns (ids_as_nested_list, decoded_text, status_message).
    """
    ensure_model(src)
    tok = model_cache["tokenizer"]
    S = int(seqlen)
    if state_ids:
        base = to_batch2(state_ids)
    else:
        base = torch.randint(0, tok.vocab_size, (1, S))
    x = apply_noise_ops(base, tok, indices_csv, int(add_left or 0), int(add_right or 0), S, seed=seed)
    return x.tolist(), decode(x[0], tok), "Applied noise"
def step_once(src, state_ids, mode, temperature, exclude_current):
    """Gradio callback: run a single denoising step on the stored sequence."""
    ensure_model(src)
    tok = model_cache["tokenizer"]
    if not state_ids:
        return None, "", "No sequence to step — initialize first."
    x = step_strategy1(
        model_cache["model"], to_batch2(state_ids),
        mode=mode, temperature=temperature, exclude_current=exclude_current,
    )
    return x.tolist(), decode(x[0], tok), f"Stepped 1 iteration ({mode})"
def live_denoise(src, state_ids, steps, snap_every, seed, mode, temperature, exclude_current):
    """Gradio generator callback: run `steps` denoise iterations, yielding an
    (ids, text, status) snapshot every `snap_every` steps and at the end.

    Yields nothing (returns immediately) when there is no current sequence.
    """
    ensure_model(src)
    tok = model_cache["tokenizer"]
    if state_ids is None or len(state_ids) == 0:
        return
    random.seed(seed); torch.manual_seed(seed)
    x = to_batch2(state_ids)
    total = int(steps); snap = max(1, int(snap_every))
    for t in range(1, total + 1):
        x = step_strategy1(model_cache["model"], x, mode=mode, temperature=temperature, exclude_current=exclude_current)
        # snapshot periodically, and always on the final step
        if (t % snap == 0) or (t == total):
            txt = decode(x[0], tok)
            yield x.tolist(), txt, f"Live denoise… step {t}/{total} ({mode})"
# ===============================================
# UI (single mode)
# ===============================================
# Flat script section: build the single-page Gradio UI and launch it.
with gr.Blocks(title="Self Organising Text Demo") as demo:
    gr.Markdown(
        """
# Self Organising Text Demo
Watch text self organise using only local attention.
"""
    )
    # Resolve the default weights source once, at UI-build time.
    default_source = os.environ.get("WEIGHTS_SOURCE", None)
    if default_source is None:
        default_source = _auto_default_source()
    with gr.Row():
        src = gr.Textbox(value=default_source, label="Weights (file / folder / HF repo id)")
        seqlen = gr.Slider(10, 512, value=50, step=1, label="Sequence length (S)")
        seed = gr.Slider(0, 10000, value=0, step=1, label="Seed")
    # Hidden state: current token ids as a nested list (shape [1, S]).
    ids_state = gr.State(value=None)
    with gr.Row():
        current_text = gr.Textbox(lines=8, label="Current text", interactive=True)
        status = gr.Markdown("Ready.")
    gr.Markdown("### Initialize & Denoise")
    with gr.Row():
        btn_random = gr.Button("Initialize Random")
        steps = gr.Slider(1, 2000, value=100, step=1, label="Denoise steps (N)")  # default 100
        snap_every = gr.Slider(1, 100, value=1, step=1, label="Update every K steps")  # default 1
    with gr.Row():
        update_mode = gr.Radio(
            choices=["argmax", "sample"],
            value="sample",  # default to sampling
            label="Update rule"
        )
        temperature = gr.Slider(minimum=0.0, maximum=5.0, value=1.0, step=0.05, label="Temperature (sampling)")
        exclude_current = gr.Checkbox(value=True, label="Exclude current token when sampling")
    with gr.Row():
        btn_step_once = gr.Button("Step Once")
        btn_live = gr.Button("Denoise Live (streaming)")
    gr.Markdown("### Noise by Indices")
    with gr.Row():
        indices_csv = gr.Textbox(
            label="Positions to noise (enter like: 0, 5, 10-20)",
            placeholder="e.g., 0, 5, 10-20"
        )
    with gr.Row():
        add_left = gr.Number(value=0, precision=0, label="Noise tokens to add at START")
        add_right = gr.Number(value=0, precision=0, label="Noise tokens to add at END")
        btn_apply_noise = gr.Button("Apply Noise")
    # --- Wiring ---
    btn_random.click(init_random, [src, seqlen, seed], [ids_state, current_text, status])
    # Manual indices + prepend/append noise
    btn_apply_noise.click(
        apply_noise,
        [src, ids_state, seqlen, indices_csv, add_left, add_right, seed],
        [ids_state, current_text, status]
    )
    btn_step_once.click(
        step_once,
        [src, ids_state, update_mode, temperature, exclude_current],
        [ids_state, current_text, status]
    )
    # live_denoise is a generator callback: it streams intermediate snapshots
    btn_live.click(
        live_denoise,
        [src, ids_state, steps, snap_every, seed, update_mode, temperature, exclude_current],
        [ids_state, current_text, status],
        show_progress=True
    )
demo.queue().launch()