File size: 17,999 Bytes
37cb069
470bcea
37cb069
 
 
 
 
470bcea
37cb069
 
 
 
 
 
 
 
470bcea
 
 
 
37cb069
 
470bcea
 
37cb069
 
 
 
 
 
 
470bcea
 
 
37cb069
 
 
 
470bcea
37cb069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
470bcea
 
 
37cb069
 
 
470bcea
37cb069
 
 
 
 
 
 
 
470bcea
37cb069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
470bcea
37cb069
 
 
 
 
 
 
 
 
 
470bcea
37cb069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
470bcea
37cb069
470bcea
 
 
37cb069
470bcea
37cb069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
470bcea
37cb069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
470bcea
37cb069
470bcea
 
 
 
 
 
37cb069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
470bcea
37cb069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
470bcea
37cb069
470bcea
37cb069
 
 
 
 
470bcea
37cb069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
470bcea
 
 
 
37cb069
470bcea
 
 
37cb069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
470bcea
37cb069
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
#!/usr/bin/env python3
"""ICSAC Editorial System — workflow entry point."""

import argparse
import sys

import config
import submission_intake
import review
import notify
import action
import email_render
import email_send


def fire_pain(title, message):
    """Send a pain signal to the operator's monitoring endpoint.

    Best-effort: returns silently when ``config.NTFY_PAIN_URL`` is unset or
    empty, and swallows any exception raised while building or sending the
    request.

    Args:
        title: Value sent in the ``Title`` request header.
        message: Text sent as the request body (encoded with ``str.encode``).
    """
    url = getattr(config, "NTFY_PAIN_URL", "")
    if not url:
        return
    import urllib.request
    try:
        req = urllib.request.Request(url, data=message.encode())
        req.add_header("Title", title)
        # Close the response explicitly so the connection is released right
        # away instead of lingering until garbage collection.
        with urllib.request.urlopen(req, timeout=5):
            pass
    except Exception:
        # Deliberate: alerting must never take the pipeline down.
        pass


def fire_brain(domain, sigtype, source, metric, value=1):
    """Push a brain signal to ``config.BRAIN_URL``.

    Best-effort: returns silently when ``config.BRAIN_URL`` is unset or
    empty, and swallows any exception raised while building or sending the
    request.

    Args:
        domain: First component of the pipe-separated ``Title`` header.
        sigtype: Second component of the ``Title`` header.
        source: Third component of the ``Title`` header.
        metric: Fourth component of the ``Title`` header.
        value: Payload sent as the JSON body ``{"value": value}``.
    """
    url = getattr(config, "BRAIN_URL", "")
    if not url:
        return
    import json
    import urllib.request
    try:
        title = f"{domain}|{sigtype}|{source}|{metric}"
        req = urllib.request.Request(
            url,
            data=json.dumps({"value": value}).encode(),
        )
        req.add_header("Title", title)
        req.add_header("Content-Type", "application/json")
        # Close the response explicitly so the connection is released right
        # away instead of lingering until garbage collection.
        with urllib.request.urlopen(req, timeout=5):
            pass
    except Exception:
        # Deliberate: telemetry must never take the pipeline down.
        pass


def fire_heartbeat(status="up", msg="OK"):
    """Push heartbeat to Uptime Kuma. Best-effort, never raises.

    Call from successful poll runs only — confirms the scheduled service ran
    end to end. Manual review invocations should NOT fire this (they'd create
    false 'all healthy' signals between scheduled polls).

    Returns silently when ``config.KUMA_PUSH_URL`` is unset or empty.

    Args:
        status: Value of the ``status`` query parameter.
        msg: Value of the ``msg`` query parameter.
    """
    base = getattr(config, "KUMA_PUSH_URL", "")
    if not base:
        return
    import urllib.parse
    import urllib.request
    try:
        params = urllib.parse.urlencode({"status": status, "msg": msg, "ping": ""})
        # Close the response explicitly so the connection is released right
        # away instead of lingering until garbage collection.
        with urllib.request.urlopen(f"{base}?{params}", timeout=5):
            pass
    except Exception:
        # Deliberate: a failed heartbeat must never take the pipeline down.
        pass


def check_model_availability(timeout: int = 15) -> dict:
    """Fetch OR's live free-tier catalog and report per-configured-slot reachability.

    Returns a structured dict so both the CLI (refresh-models) and the batch
    tick scheduler can share one implementation. A slot is 'dead' when
    EVERY entry in its fallback chain is missing from the live catalog —
    OpenRouter's intra-slot fallback cannot rescue a fully-missing chain.

    Errors fetching the catalog surface as fetched=False; batch-tick treats
    this the same as a dead slot (can't confirm reachability → skip reviews).
    A response that decodes to something other than a JSON object is reported
    the same way, since reachability cannot be confirmed from it either.

    Args:
        timeout: Seconds to wait for the catalog request.

    Returns:
        On failure: ``{"fetched": False, "error": str, "free_models": [],
        "slots": [], "any_slot_dead": True}``.
        On success: ``{"fetched": True, "free_models": [...], "slots": [...],
        "any_slot_dead": bool}`` where ``free_models`` holds the catalog
        entries whose id ends in ``:free`` (largest ``context_length`` first)
        and each slot entry has ``index`` (1-based), ``chain``, ``reachable``,
        ``missing`` and ``dead``.
    """
    import json as _json
    import urllib.request

    url = getattr(config, "OPENROUTER_MODELS_API_URL",
                  "https://openrouter.ai/api/v1/models")
    try:
        with urllib.request.urlopen(url, timeout=timeout) as resp:
            data = _json.loads(resp.read().decode())
        if not isinstance(data, dict):
            raise ValueError(
                f"unexpected catalog payload type: {type(data).__name__}"
            )
    except Exception as e:
        return {
            "fetched": False,
            "error": str(e),
            "free_models": [],
            "slots": [],
            "any_slot_dead": True,
        }

    # Tolerate a null "data" field and skip entries that are not objects with
    # a string id, so one odd catalog row cannot crash the caller.
    free = [
        m for m in (data.get("data") or [])
        if isinstance(m, dict)
        and isinstance(m.get("id"), str)
        and m["id"].endswith(":free")
    ]
    free_ids = {m["id"] for m in free}
    # A null context_length sorts as 0 instead of raising on ``-None``.
    free.sort(key=lambda m: -(m.get("context_length") or 0))

    slots_info = []
    for i, slot in enumerate(getattr(config, "OPENROUTER_MODELS", []), 1):
        # A slot is either a single model id or a fallback chain; accept
        # tuples as chains too, not only lists.
        chain = list(slot) if isinstance(slot, (list, tuple)) else [slot]
        reachable = [m for m in chain if m in free_ids]
        missing = [m for m in chain if m not in free_ids]
        slots_info.append({
            "index": i,
            "chain": chain,
            "reachable": reachable,
            "missing": missing,
            "dead": not reachable,
        })

    return {
        "fetched": True,
        "free_models": free,
        "slots": slots_info,
        "any_slot_dead": any(s["dead"] for s in slots_info),
    }


def review_doi(doi: str, skip_notify: bool = False) -> dict:
    """Run the full review pipeline for a single DOI.

    Steps: ingest the record, run the reviewer panel, then (unless
    ``skip_notify`` is set) send notifications. Progress is printed to
    stdout. Notification failures are reported but do not fail the review.

    Args:
        doi: DOI passed to ``submission_intake.ingest_doi``.
        skip_notify: When True, the notification step is skipped.

    Returns:
        On success, a dict with ``doi``, ``title``, ``recommendation`` and
        ``disagreement``. When ingest or review raises, or when a downloaded
        PDF yields less than ``submission_intake.PDF_TEXT_MIN_CHARS``
        characters of text, a dict with ``doi`` and ``error``.
    """
    print(f"\n{'='*60}")
    print(f"Processing: {doi}")
    print(f"{'='*60}")

    # Ingest
    print("\n[1/3] Ingesting from Zenodo...")
    try:
        review_data = submission_intake.ingest_doi(doi)
    except Exception as e:
        print(f"  FAILED: {e}")
        return {"doi": doi, "error": str(e)}

    print(f"  Title: {review_data['title']}")
    print(f"  Authors: {', '.join(review._creator_display_names(review_data.get('creators')))}")
    pdf_status = "downloaded" if review_data.get("pdf_path") else "not available"
    print(f"  PDF: {pdf_status}")

    # ``or ""`` covers a key that is present but None, which would otherwise
    # crash in len() instead of producing the intended rejection.
    full_text_len = len(review_data.get("full_text") or "")
    if review_data.get("pdf_path") and full_text_len < submission_intake.PDF_TEXT_MIN_CHARS:
        msg = (
            f"PDF has no usable text layer ({full_text_len} chars extracted). "
            f"ICSAC requires text-layer PDFs — image-only scans and "
            f"raster-print deposits are not reviewed. Submitter must upload "
            f"a text-layer version."
        )
        print(f"  FAILED: {msg}")
        fire_pain(
            "ICSAC Pipeline: PDF requires text layer",
            f"{doi}: {(review_data.get('title') or '')[:120]}\n{msg}",
        )
        return {"doi": doi, "error": msg}

    # Review
    print("\n[2/3] Running reviewer panel...")
    try:
        markdown, aggregate = review.review_paper(review_data)
    except Exception as e:
        print(f"  FAILED: {e}")
        return {"doi": doi, "error": str(e)}

    rec = aggregate.get("recommendation", "REVIEW_FURTHER")
    print(f"  Recommendation: {rec}")
    print(f"  Disagreement: {aggregate.get('disagreement', False)}")

    # Notify
    if not skip_notify:
        print("\n[3/3] Sending notifications...")
        try:
            notify.notify_review_complete(review_data, aggregate)
            print("  Notifications sent.")
        except Exception as e:
            print(f"  Notification error (non-fatal): {e}")
    else:
        print("\n[3/3] Notifications skipped.")

    fire_brain("business", "reward", "editorial_system", "review_completed", 1)
    # Only these three outcomes emit an outcome event; anything else
    # (e.g. the REVIEW_FURTHER default) emits none.
    outcome_metric = {
        "RECOMMEND": "recommend",
        "REVISE_AND_RESUBMIT": "revise_and_resubmit",
        "REJECT": "reject",
    }.get(rec)
    if outcome_metric is not None:
        fire_brain("business", "event", "editorial_system", outcome_metric, 1)

    return {
        "doi": doi,
        "title": review_data["title"],
        "recommendation": rec,
        "disagreement": aggregate.get("disagreement", False),
    }


def poll_community() -> None:
    """List pending community requests and report the poll as healthy.

    Fetches the requests via ``action.get_community_requests()``, prints one
    line per request, pushes the pending count as a brain signal when there
    is at least one, and always finishes with an "up" heartbeat.
    """
    print("\nPolling ICSAC community requests...")
    pending = action.get_community_requests()

    if pending:
        count = len(pending)
        print(f"  Found {count} request(s).")
        fire_brain("business", "state", "editorial_system", "pending_requests", count)
        for entry in pending:
            record = entry.get("topic", {}).get("record", "")
            status = entry.get("status", "")
            print(f"  - Request {entry.get('id')}: record={record} status={status}")
        fire_heartbeat("up", f"poll ok, {count} pending")
        return

    # Nothing queued: still a successful poll, so the heartbeat fires.
    print("  No pending requests.")
    fire_heartbeat("up", "poll ok, 0 pending")


def main():
    """Parse the command line and dispatch to the selected subcommand.

    Subcommands: ``review``, ``poll``, ``requests``, ``accept``, ``reject``,
    ``watch-tick``, ``watch-bootstrap``, ``refresh-models``, ``batch-tick``
    and ``email``. When no subcommand is given the help text is printed and
    the process exits with status 1.

    The ``refresh-models``, ``batch-tick``, ``email``, ``watch-tick`` and
    ``watch-bootstrap`` branches always terminate via ``sys.exit``; the
    remaining branches return normally.
    """
    parser = argparse.ArgumentParser(
        description="ICSAC Open Review Pipeline"
    )
    sub = parser.add_subparsers(dest="command")

    # review command
    rev = sub.add_parser("review", help="Review one or more DOIs")
    rev.add_argument("dois", nargs="+", help="DOI(s) to review")
    rev.add_argument("--skip-notify", action="store_true", help="Skip notifications")

    # poll command
    sub.add_parser("poll", help="Poll community for pending requests")

    # requests command
    sub.add_parser("requests", help="List pending community requests")

    # accept/reject commands
    acc = sub.add_parser("accept", help="Accept a community request")
    acc.add_argument("request_id", help="Request ID to accept")
    acc.add_argument("--comment", default="", help="Comment for acceptance")

    rej = sub.add_parser("reject", help="Reject a community request")
    rej.add_argument("request_id", help="Request ID to reject")
    rej.add_argument("--comment", default="", help="Comment for rejection")

    sub.add_parser("watch-tick", help="Run one watcher cycle: detect transitions, fire side effects")
    sub.add_parser("watch-bootstrap", help="Seed state from current Zenodo state without firing side effects (run once on install)")

    refresh = sub.add_parser("refresh-models", help="Print currently-working free models from OpenRouter live API")
    refresh.add_argument("--check-exit", action="store_true",
                         help="Exit 2 if any configured slot has no reachable model (for cron health checks)")

    sub.add_parser("batch-tick", help="Run the twice-daily batch workflow: model check + watch-tick + summary")

    em = sub.add_parser("email", help="Render and (optionally) send accept / revise-and-resubmit / reject / invite emails")
    em.add_argument("kind", choices=["accept", "revise-and-resubmit", "reject", "invite"],
                    help=("accept = sends accept + community invite; "
                          "revise-and-resubmit = default decline path (engageable in-scope work); "
                          "reject = woo template (scope-not-suitable / pseudoscience only — NOT the standard decline path); "
                          "invite = resend invite only"))
    em.add_argument("doi", help="Zenodo DOI of the paper")
    em.add_argument("to", help="Recipient email address")
    em.add_argument("--send", action="store_true", help="Actually send (default: dry-run preview)")

    args = parser.parse_args()

    if args.command == "review":
        results = [review_doi(doi, skip_notify=args.skip_notify) for doi in args.dois]

        print(f"\n{'='*60}")
        print("BATCH SUMMARY")
        print(f"{'='*60}")
        for r in results:
            # Successful results carry a recommendation, failed ones an error.
            status = r.get("recommendation", r.get("error", "UNKNOWN"))
            print(f"  {r['doi']}: {status}")

    elif args.command == "poll":
        poll_community()

    elif args.command == "requests":
        for r in action.get_community_requests():
            print(f"  ID: {r.get('id')}  Status: {r.get('status')}")

    elif args.command == "accept":
        # NOTE(review): a failed accept still exits 0; a non-zero exit would
        # let scripts detect it — confirm no caller depends on the current code.
        ok = action.accept_request(args.request_id, args.comment)
        print("Accepted." if ok else "Failed.")

    elif args.command == "reject":
        # NOTE(review): same exit-status caveat as the accept branch.
        ok = action.reject_request(args.request_id, args.comment)
        print("Rejected." if ok else "Failed.")

    elif args.command == "refresh-models":
        result = check_model_availability()
        if not result["fetched"]:
            print(f"Failed to fetch models: {result.get('error', 'unknown')}")
            sys.exit(1)
        free = result["free_models"]
        print(f"\n=== {len(free)} FREE MODELS (live from OpenRouter) ===\n")
        print(f"{'MODEL':<60s} {'CTX':>10s}")
        print("-" * 75)
        for m in free:
            # ``or 0`` keeps the integer format spec from failing when the
            # catalog reports a null context_length.
            print(f"{m['id']:<60s} {(m.get('context_length') or 0):>10d}")
        print(f"\nCurrently configured slots:")
        for slot in result["slots"]:
            print(f"  Slot {slot['index']}: {' -> '.join(slot['chain'])}")
            for m in slot["chain"]:
                marker = "OK" if m in slot["reachable"] else "MISSING from free list"
                print(f"           {m}: {marker}")
            if slot["dead"]:
                print(f"           !! SLOT {slot['index']} IS DEAD (every fallback missing)")
        if args.check_exit and result["any_slot_dead"]:
            sys.exit(2)
        sys.exit(0)

    elif args.command == "batch-tick":
        import watch
        import notify
        import publish_watcher

        print("== ICSAC Batch Tick ==")
        print("[1/4] Checking OR model availability...")
        mod = check_model_availability()
        skip_reviews = False
        if not mod["fetched"]:
            print(f"  catalog fetch failed: {mod.get('error')}")
            skip_reviews = True
        else:
            dead = [s for s in mod["slots"] if s["dead"]]
            if dead:
                for s in dead:
                    print(f"  SLOT {s['index']} DEAD — chain {s['chain']} all missing")
                skip_reviews = True
            else:
                print(f"  all {len(mod['slots'])} OR slots have >=1 reachable model")

        # Computed once; used by both the pain alert and the summary below.
        dead_slots = [s["index"] for s in mod.get("slots", []) if s["dead"]]

        if skip_reviews:
            fire_pain(
                "ICSAC Batch Tick: review step skipped",
                (
                    f"OR model availability check failed (fetched={mod['fetched']}, "
                    f"dead_slots={dead_slots}). State transitions still handled; "
                    f"new submissions tracked but not reviewed until next healthy tick."
                ),
            )

        print(f"[2/4] Running watch tick (skip_reviews={skip_reviews})...")
        # watch.main() is driven through sys.argv, so swap in the arguments
        # it should see before calling it.
        sys.argv = ["watch"] + (["--skip-reviews"] if skip_reviews else [])
        rc = watch.main()

        print("[3/4] Polling staged Zenodo drafts for publish transitions...")
        try:
            publish_summary = publish_watcher.poll_drafts()
            print(
                f"  publish_watcher: checked={publish_summary['checked']} "
                f"published={publish_summary['published']} "
                f"still_draft={publish_summary['still_draft']} "
                f"errors={publish_summary['errors']}"
            )
        except Exception as e:
            print(f"  publish_watcher crashed (non-fatal): {e}")
            # Placeholder summary so the curator alert below can still render.
            publish_summary = {"checked": 0, "published": 0,
                               "still_draft": 0, "errors": 1,
                               "transitions": []}

        print("[4/4] Summary curator alert...")
        try:
            if mod["fetched"]:
                model_status = (
                    f"{len(mod['slots']) - len(dead_slots)}/{len(mod['slots'])} OR slots live"
                    + (f" (dead: {dead_slots})" if dead_slots else "")
                )
            else:
                model_status = f"catalog fetch failed: {mod.get('error', 'unknown')[:80]}"
            publish_line = (
                f"Publish-watcher: {publish_summary['published']} new, "
                f"{publish_summary['still_draft']} still draft, "
                f"{publish_summary['errors']} errors"
            )
            if publish_summary["transitions"]:
                publish_line += f" — {', '.join(publish_summary['transitions'])}"
            msg = (
                f"ICSAC Batch Tick complete\n\n"
                f"Models: {model_status}\n"
                f"Reviews: {'SKIPPED (starved panel)' if skip_reviews else 'ran'}\n"
                f"Watch tick exit: {rc}\n"
                f"{publish_line}\n\n"
                f"Transitions (accept/decline) always run regardless of model state."
            )
            notify.send_to_curator(msg, parse_mode=None)
        except Exception as e:
            print(f"  summary curator alert failed (non-fatal): {e}")

        # The process exit status mirrors the watch tick's return value.
        sys.exit(rc)

    elif args.command == "email":
        import time
        review_data = submission_intake.ingest_doi(args.doi)

        def _deliver(label: str, rendered: str, send_fn) -> bool:
            """Print the rendered email, hand it to ``send_fn``, report the outcome."""
            print(f"\n=== {label} ===")
            print(rendered)
            ok, msg = send_fn(args.to, rendered, send=args.send)
            print("=== DELIVERY ===")
            print(("OK" if ok else "FAIL") + ": " + msg)
            return ok

        if args.kind == "accept":
            ok1 = _deliver("EMAIL 1/2 — ACCEPT",
                           email_render.render_accept_email(review_data),
                           email_send.send_accept_email)
            if not ok1:
                # Do not send the invite when the accept email itself failed.
                if not args.send:
                    print("\n(dry-run; pass --send to actually deliver)")
                sys.exit(1)
            if args.send:
                # Pause between the two real sends; skipped for dry runs.
                time.sleep(5)
            ok2 = _deliver("EMAIL 2/2 — COMMUNITY INVITE",
                           email_render.render_community_invite_email(review_data),
                           email_send.send_invite_email)
            if not args.send:
                print("\n(dry-run; pass --send to actually deliver both)")
            sys.exit(0 if (ok1 and ok2) else 1)
        elif args.kind == "revise-and-resubmit":
            ok = _deliver("REVISE-AND-RESUBMIT EMAIL",
                          email_render.render_revise_and_resubmit_email(review_data),
                          email_send.send_revise_and_resubmit_email)
        elif args.kind == "reject":
            ok = _deliver("SCOPE-REJECT EMAIL (scope-not-suitable)",
                          email_render.render_scope_reject_email(review_data),
                          email_send.send_scope_reject_email)
        else:  # invite
            ok = _deliver("COMMUNITY INVITE",
                          email_render.render_community_invite_email(review_data),
                          email_send.send_invite_email)
        if not args.send:
            print("\n(dry-run; pass --send to actually deliver)")
        sys.exit(0 if ok else 1)

    elif args.command == "watch-tick":
        import watch
        # NOTE(review): unlike batch-tick and watch-bootstrap, sys.argv is not
        # rewritten here, so watch.main() sees this CLI's own arguments —
        # confirm that is intended.
        sys.exit(watch.main())

    elif args.command == "watch-bootstrap":
        import watch
        sys.argv = ["watch", "--bootstrap"]
        sys.exit(watch.main())

    else:
        parser.print_help()
        sys.exit(1)


if __name__ == "__main__":
    # Script entry: run the CLI, turn Ctrl-C into exit status 130, and send a
    # pain alert for any other uncaught exception before re-raising it.
    try:
        main()
    except KeyboardInterrupt:
        sys.exit(130)
    except Exception as crash:
        crash_summary = f"Pipeline crashed: {type(crash).__name__}: {crash}"
        fire_pain("editorial-system failed", crash_summary)
        raise