| python -m reframr serve --model model.safetensors --max-tokens 120 | |
| # Example requests to paste into the JSONL server (one JSON object per line): | |
| # {"system":"Answer like a deployment lead. Be direct and source-grounded.","prompt":"Draft a rollback plan for a payments API release.","temperature":0.58,"decode_top_k":64,"max_tokens":180} | |
| # {"prompt":"Who won the Rivergate mayoral runoff?","tool_results":[{"name":"web.search","ok":true,"source":{"title":"Local Civic Wire","url":"https://example.org/rivergate-runoff","snippet":"Mara Ibekwe won the Rivergate mayoral runoff with 52.4 percent of the vote."}}],"max_tokens":80} | |