Spaces:

Aluode
/

StockCheck

Running

App Files Files Community

StockCheck / stock.py

Aluode

Upload 6 files

3151dff verified 1 day ago

Raw

History Blame Contribute Delete

11.3 kB

	"""
	stock.py — "Did this stock actually change?" on free Yahoo data (no API key).

	Finance-native use of the same machinery, honestly matched to how prices behave:
	* SHOCK events — the Clutch's MagnitudeGate fed with \|daily return\| / typical move.
	A single outsized day trips it instantly; several stressed days in a
	row accumulate and trip it too (which a naive threshold misses).
	* VOLATILITY regime changes — the iid change detector (change.detect) run on rolling
	daily volatility: "a normal day used to be ±1.1%, now it's ±2.6%".
	* DRIFT — total return over the window, compared against what pure luck could
	produce (sigma * sqrt(n)), stated plainly.

	Data: yfinance (Yahoo Finance scrape — free, keyless). News: yfinance's news feed,
	also keyless. Both can rate-limit; failures are reported, never faked.
	"""

	import time
	import numpy as np
	from clutch import Clutch, MagnitudeGate
	from change import detect

	# ------------------------------------------------------------------ data (keyless)
	_CACHE = {}
	_TTL = 900 # 15 min


	def fetch_prices(ticker, period="1y"):
	"""Returns (dates, close, currency, err). Cached to be polite to Yahoo."""
	key = (ticker.upper().strip(), period, int(time.time() // _TTL))
	if key in _CACHE:
	return _CACHE[key]
	try:
	import yfinance as yf
	tk = yf.Ticker(ticker.strip())
	hist = tk.history(period=period, interval="1d", auto_adjust=True)
	if hist is None or len(hist) < 40 or "Close" not in hist:
	out = (None, None, "", f"Couldn't get enough daily data for '{ticker}'. "
	"Check the symbol (Yahoo format, e.g. AAPL, NOK, BTC-USD, ^GSPC).")
	else:
	close = hist["Close"].to_numpy(dtype=float)
	dates = [d.strftime("%Y-%m-%d") for d in hist.index]
	cur = ""
	try:
	cur = tk.fast_info.get("currency") or ""
	except Exception:
	pass
	out = (dates, close, cur, None)
	except Exception as e:
	out = (None, None, "", f"Data fetch failed ({type(e).__name__}). Yahoo sometimes "
	"rate-limits shared servers — wait a minute and try again.")
	_CACHE[key] = out
	return out


	def fetch_news(ticker, k=6):
	"""Free Yahoo headlines via yfinance; tolerant of old and new item formats."""
	try:
	import yfinance as yf
	raw = yf.Ticker(ticker.strip()).news or []
	except Exception:
	return []
	return parse_news(raw, k)


	def parse_news(raw, k=6):
	items = []
	for it in raw[: k * 2]:
	c = it.get("content", it) if isinstance(it, dict) else {}
	title = c.get("title") or it.get("title")
	if not title:
	continue
	url = ""
	cu = c.get("canonicalUrl") or c.get("clickThroughUrl") or {}
	if isinstance(cu, dict):
	url = cu.get("url", "")
	url = url or it.get("link", "")
	prov = c.get("provider") or {}
	publisher = (prov.get("displayName") if isinstance(prov, dict) else None) \
	or it.get("publisher", "")
	when = c.get("pubDate") or c.get("displayTime") or ""
	if not when and it.get("providerPublishTime"):
	when = time.strftime("%Y-%m-%d", time.gmtime(it["providerPublishTime"]))
	when = str(when)[:10]
	items.append(dict(title=title.strip(), url=url, publisher=publisher, when=when))
	if len(items) >= k:
	break
	return items


	# ------------------------------------------------------------------ analysis
	def robust_sigma(x):
	return float(1.4826 * np.median(np.abs(x - np.median(x))) + 1e-12)


	def local_sigma(rets, win=60, warm=20):
	"""Past-only rolling robust sigma, so a rough regime stops spamming shock flags
	but a fresh crash (judged against the calm past) still screams."""
	g = robust_sigma(rets)
	out = np.full(len(rets), g)
	for i in range(warm, len(rets)):
	out[i] = max(robust_sigma(rets[max(0, i - win):i]), 0.4 * g)
	return out


	def shock_events(rets, sensitivity=1.0):
	"""Clutch gate on \|return\| / local typical move. A single outsized day trips it
	instantly; several stressed days in a row accumulate and trip it too.
	Returns (events, sig_global, calm_days)."""
	sig = robust_sigma(rets)
	loc = local_sigma(rets)
	gate = MagnitudeGate(gain=3.0, leak=3.2, trip=8.0 * sensitivity)
	trips = []
	for i, r in enumerate(rets):
	if gate.update(abs(r) / loc[i]):
	trips.append(i)
	gate.clear()
	events = []
	for i in trips:
	if events and i - events[-1][-1] <= 3:
	events[-1].append(i)
	else:
	events.append([i])
	out = []
	for grp in events:
	i0 = max(0, grp[0] - 2)
	i1 = min(len(rets) - 1, grp[-1])
	cum = float(np.sum(rets[i0:i1 + 1]))
	peak_i = i0 + int(np.argmax(np.abs(rets[i0:i1 + 1])))
	peak = float(np.abs(rets[peak_i]) / loc[peak_i])
	biggest = float(rets[peak_i])
	out.append(dict(i0=i0, i1=i1, cum_ret=cum, peak_z=peak, biggest=biggest))
	calm = len(rets) - sum(e["i1"] - e["i0"] + 1 for e in out)
	return out, sig, calm


	def vol_regimes(rets, sensitivity=1.0, win=15):
	"""Non-overlapping window vols + strongest-split ratio test (near-independent
	samples, unlike a rolling window). Reports at most one regime change — the
	strongest — per period. Returns [] or [dict(at, before, after, ratio)]."""
	n = len(rets)
	m = n // win
	if m < 8:
	return []
	v = np.array([robust_sigma(rets[k * win:(k + 1) * win]) for k in range(m)])
	best = None
	for k in range(3, m - 2):
	before, after = float(np.median(v[:k])), float(np.median(v[k:]))
	ratio = after / (before + 1e-12)
	score = max(ratio, 1.0 / ratio)
	if best is None or score > best[0]:
	best = (score, k, before, after, ratio)
	score, k, before, after, ratio = best
	thresh = 1.0 + 0.75 * sensitivity # sens 1 -> 1.75x; strict 1.5 -> ~2.1x; eager 0.7 -> ~1.5x
	if score < thresh:
	return []
	# refine the change day: best day-level split within +/-2 windows of the coarse one
	c0 = k * win
	best_c, best_dev = c0, 0.0
	for c in range(max(30, c0 - 2 * win), min(n - 30, c0 + 2 * win)):
	b = robust_sigma(rets[max(0, c - 60):c])
	a = robust_sigma(rets[c:c + 60])
	dev = abs(np.log(a / (b + 1e-12) + 1e-12))
	if dev > best_dev:
	best_dev, best_c = dev, c
	before = robust_sigma(rets[max(0, best_c - 60):best_c])
	after = robust_sigma(rets[best_c:best_c + 60])
	return [dict(at=best_c, before=before, after=after, ratio=after / (before + 1e-12))]


	def analyze(dates, close, sensitivity=1.0):
	logp = np.log(np.asarray(close, float))
	rets = np.diff(logp)
	shocks, sig_d, calm = shock_events(rets, sensitivity)
	vols = vol_regimes(rets, sensitivity)
	total = float(logp[-1] - logp[0])
	luck2 = 2.0 * sig_d * np.sqrt(len(rets)) # 2-sigma of pure-luck drift
	return dict(rets=rets, sig_d=sig_d, shocks=shocks, vols=vols, calm=calm,
	total=total, luck2=luck2, n=len(rets))


	# ------------------------------------------------------------------ language
	def pct(x):
	return f"{(np.exp(x) - 1) * 100:+.1f}%"


	def verdict_md(ticker, dates, close, a, currency=""):
	n = a["n"]
	d0, d1 = dates[0], dates[-1]
	sig_pct = (np.exp(a["sig_d"]) - 1) * 100
	lines = []
	if not a["shocks"] and not a["vols"]:
	lines.append(f"## 😌 {ticker}: a quiet stretch — ordinary wobble only")
	lines.append(f"Across {n} trading days ({d0} → {d1}), no day or cluster of days "
	f"broke out of this stock's normal movement (a typical day here is about "
	f"±{sig_pct:.1f}%). Every scary-looking dip in this window was "
	f"within what dice would produce.")
	else:
	k = len(a["shocks"]) + len(a["vols"])
	lines.append(f"## 🔔 {ticker}: {k} real event{'s' if k != 1 else ''} in this window")
	ranked = sorted(a["shocks"],
	key=lambda e: max(e["peak_z"], abs(e["cum_ret"]) / (a["sig_d"] + 1e-12)),
	reverse=True)
	hidden = max(0, len(ranked) - 5)
	for e in sorted(ranked[:5], key=lambda e: e["i0"]):
	day0, day1 = dates[e["i0"] + 1], dates[e["i1"] + 1]
	span = f"on {day1}" if e["i0"] == e["i1"] else f"over {day0} → {day1}"
	if abs(e["cum_ret"]) < 0.5 * abs(e["biggest"]):
	lines.append(f"- Violent swings {span} that largely cancelled out "
	f"(net {pct(e['cum_ret'])}, sharpest single day {pct(e['biggest'])}, "
	f"about {e['peak_z']:.0f}× normal). Something happened there even "
	f"though the price ended near where it started.")
	else:
	direction = "down" if e["cum_ret"] < 0 else "up"
	lines.append(f"- Shock {span}: moved {direction} {pct(e['cum_ret'])} "
	f"(sharpest day about {e['peak_z']:.0f}× a normal day). That is a "
	f"real event, not wobble — worth knowing why (headlines below).")
	if hidden:
	lines.append(f"- (+ {hidden} smaller flare-up{'s' if hidden > 1 else ''} not "
	f"listed — nothing above {ranked[5]['peak_z']:.0f}× normal.)")
	for v in a["vols"]:
	day = dates[min(v["at"] + 1, len(dates) - 1)]
	b = (np.exp(v["before"]) - 1) * 100
	af = (np.exp(v["after"]) - 1) * 100
	word = "rougher" if af > b else "calmer"
	lines.append(f"- The ride got {word} around {day}: a typical day went from "
	f"about ±{b:.1f}% to ±{af:.1f}%. Same stock, different weather.")
	# drift vs luck — the part people get wrong most
	tot, luck = a["total"], a["luck2"]
	lines.append("")
	if abs(tot) > luck:
	lines.append(f"The drift is real too: {pct(tot)} over the period — more than the "
	f"±{(np.exp(luck)-1)*100:.0f}% that pure day-to-day luck could plausibly "
	f"produce over {n} days.")
	else:
	lines.append(f"About the overall {pct(tot)} move: over {n} days, pure luck at this "
	f"stock's wobble could produce anything within about "
	f"±{(np.exp(luck)-1)*100:.0f}%. So the period's drift, by itself, is "
	f"not distinguishable from chance — an honest thing almost no chart "
	f"commentary will tell you.")
	lines.append("")
	lines.append(f"Your attention, saved: {a['calm']} of {n} days were inside the normal "
	f"band — days when checking the chart could tell you nothing.")
	lines.append("")
	lines.append("<small>This describes what already happened in free Yahoo data; it predicts "
	"nothing and is not investment advice or a recommendation to buy or sell "
	"anything. Past shocks say nothing about future ones.</small>")
	return "\n".join(lines)