grc-iit
/

FunctionGemma-ndp

function-calling

Model card Files Files and versions

shazzadulimun committed on 4 days ago

Commit

55e313c

·

verified ·

1 Parent(s): 057dde7

Add live-MCP test code block

Files changed (1) hide show

README.md +74 -0

README.md CHANGED Viewed

@@ -49,6 +49,80 @@ Output format is FunctionGemma native:
 <start_function_call>call:list_organizations{server:<escape>global<escape>}<end_function_call>
 ```
 ## Files
 - `merged_16bit/` — full safetensors checkpoint

 <start_function_call>call:list_organizations{server:<escape>global<escape>}<end_function_call>
 ```
+## Live test against the upstream NDP MCP
+End-to-end: model → tool call → upstream `clio-kit` NDP MCP → real NDP response.
+```python
+# /// script
+# requires-python = ">=3.11"
+# dependencies = [
+#   "transformers>=4.45", "torch>=2.4", "accelerate>=0.34",
+#   "sentencepiece>=0.2", "protobuf>=4", "mcp>=1.0",
+# ]
+# ///
+import asyncio, json, re
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+from mcp import ClientSession, StdioServerParameters
+from mcp.client.stdio import stdio_client
+MID = "shazzadulimun/FunctionGemma-ndp"  # Hub repo id for both from_pretrained calls; NOTE(review): this page is under grc-iit/FunctionGemma-ndp — confirm the owner
+PROMPT = "List all organizations on the NDP global server"  # sent as the single user message
+# 14-tool NDP catalog reshaped as OpenAI function specs (truncated here: only list_organizations is shown).
+tools = [{"type": "function", "function": {
+    "name": "list_organizations",
+    "description": "List organizations available in the National Data Platform.",
+    "parameters": {"type": "object", "properties": {
+        "name_filter": {"type": "string"}, "server": {"type": "string"},
+    }, "required": []},  # both arguments are optional
+}}]
+tok = AutoTokenizer.from_pretrained(MID, subfolder="merged_16bit")  # tokenizer and weights are both read from merged_16bit/
+mdl = AutoModelForCausalLM.from_pretrained(
+    MID, subfolder="merged_16bit", dtype=torch.bfloat16, device_map="auto",  # NOTE(review): older transformers releases spell this torch_dtype — confirm against the >=4.45 floor
+)
+text = tok.apply_chat_template(
+    [{"role": "user", "content": PROMPT}],
+    tools=tools, add_generation_prompt=True, tokenize=False,  # tokenize=False: get the rendered prompt as text; it is tokenized on the next statement
+)
+inp = tok(text, return_tensors="pt").to(mdl.device)  # move the encoded prompt to the model's device
+out = mdl.generate(**inp, max_new_tokens=300)  # cap the completion at 300 new tokens
+raw = tok.decode(out[0][inp.input_ids.shape[-1]:], skip_special_tokens=False)  # decode only the tokens after the prompt; special tokens are kept (presumably so the <start_function_call> markers survive — confirm)
+# Parse FunctionGemma format: <start_function_call>call:NAME{k:v,...}<end_function_call>
+m = re.search(r"<start_function_call>\s*call:(\w+)\s*\{(.*?)\}\s*<end_function_call>",
+              raw, re.DOTALL)
+name = m.group(1)
+args = {}
+for k, v in re.findall(r"(\w+)\s*:\s*(<escape>.*?<escape>|None|\w+)", m.group(2)):
+    if v == "None":
+        continue                                      # strip phantom nulls
+    args[k] = re.sub(r"<escape>|<escape>", "", v) if "<escape>" in v else v
+# Spawn the upstream clio-kit NDP MCP and call the parsed tool against it.
+async def call():
+    params = StdioServerParameters(command="uvx", args=[
+        "--from",
+        "git+https://github.com/iowarp/clio-kit.git#subdirectory=clio-kit-mcp-servers/ndp",
+        "ndp-mcp",
+    ])
+    async with stdio_client(params) as (r, w):
+        async with ClientSession(r, w) as s:
+            await s.initialize()
+            out = await s.call_tool(name, args)
+            print("".join(c.text for c in out.content if hasattr(c, "text")))
+asyncio.run(call())
+```
+Save as `test.py` and run:
+```bash
+uv run --isolated test.py
+```
 ## Files
 - `merged_16bit/` — full safetensors checkpoint