Instructions to use my-ai-stack/Stack-2-9-finetuned with libraries, inference providers, notebooks, and local apps. Follow these links to get started.

Libraries

How to use my-ai-stack/Stack-2-9-finetuned with Transformers:

# Use a pipeline as a high-level helper
from transformers import pipeline

# Build a text-generation pipeline bound to the fine-tuned model.
pipe = pipeline("text-generation", model="my-ai-stack/Stack-2-9-finetuned")
# Chat-style input: a list of message dicts, each with "role" and "content".
messages = [
    {"role": "user", "content": "Who are you?"},
]
# Run generation on the conversation. The return value is discarded here;
# wrap the call in print(...) when running this as a script.
pipe(messages)

# Load model directly
from transformers import AutoTokenizer, AutoModelForCausalLM

# Tokenizer and model are loaded from the same model id.
tokenizer = AutoTokenizer.from_pretrained("my-ai-stack/Stack-2-9-finetuned")
model = AutoModelForCausalLM.from_pretrained("my-ai-stack/Stack-2-9-finetuned")
# Chat-style input: a list of message dicts, each with "role" and "content".
messages = [
    {"role": "user", "content": "Who are you?"},
]
# Render the conversation with the tokenizer's chat template, tokenize it,
# and move the resulting tensors to the device the model lives on.
inputs = tokenizer.apply_chat_template(
	messages,
	add_generation_prompt=True,
	tokenize=True,
	return_dict=True,
	return_tensors="pt",
).to(model.device)

# Generate at most 40 new tokens after the prompt.
outputs = model.generate(**inputs, max_new_tokens=40)
# Slice off the first inputs["input_ids"].shape[-1] tokens (the prompt) so
# only the newly generated continuation is decoded and printed.
print(tokenizer.decode(outputs[0][inputs["input_ids"].shape[-1]:]))

Notebooks
Google Colab
Kaggle
Local Apps

vLLM

How to use my-ai-stack/Stack-2-9-finetuned with vLLM:

Install from pip and serve model

# Install vLLM from pip:
pip install vllm
# Start the vLLM server:
vllm serve "my-ai-stack/Stack-2-9-finetuned"
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:8000/v1/chat/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "my-ai-stack/Stack-2-9-finetuned",
		"messages": [
			{
				"role": "user",
				"content": "What is the capital of France?"
			}
		]
	}'

Use Docker

docker model run hf.co/my-ai-stack/Stack-2-9-finetuned

SGLang

How to use my-ai-stack/Stack-2-9-finetuned with SGLang:

Install from pip and serve model

# Install SGLang from pip:
pip install sglang
# Start the SGLang server:
python3 -m sglang.launch_server \
    --model-path "my-ai-stack/Stack-2-9-finetuned" \
    --host 0.0.0.0 \
    --port 30000
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/chat/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "my-ai-stack/Stack-2-9-finetuned",
		"messages": [
			{
				"role": "user",
				"content": "What is the capital of France?"
			}
		]
	}'

Use Docker images

docker run --gpus all \
    --shm-size 32g \
    -p 30000:30000 \
    -v ~/.cache/huggingface:/root/.cache/huggingface \
    --env "HF_TOKEN=<secret>" \
    --ipc=host \
    lmsysorg/sglang:latest \
    python3 -m sglang.launch_server \
        --model-path "my-ai-stack/Stack-2-9-finetuned" \
        --host 0.0.0.0 \
        --port 30000
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/chat/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "my-ai-stack/Stack-2-9-finetuned",
		"messages": [
			{
				"role": "user",
				"content": "What is the capital of France?"
			}
		]
	}'

Docker Model Runner
How to use my-ai-stack/Stack-2-9-finetuned with Docker Model Runner:
```
docker model run hf.co/my-ai-stack/Stack-2-9-finetuned
```

Stack-2-9-finetuned / src / cli / agent.py

walidsobhie-code

refactor: Clean up project structure - fewer root folders

99a7be2 about 2 months ago

raw

history blame

18.9 kB

	#!/usr/bin/env python3
	"""
	Stack 2.9 - Core Agent Logic Module
	Query understanding, tool selection, response generation, and self-reflection loop.
	"""

	import os
	import json
	import re
	import asyncio
	from pathlib import Path
	from typing import Any, Dict, List, Optional, Union, Callable
	from dataclasses import dataclass, field
	from datetime import datetime
	from enum import Enum

	from .tools import TOOLS, get_tool, list_tools, get_tool_schemas
	from .context import ContextManager, create_context_manager


	class QueryIntent(Enum):
	    """Intents recognized by the agent.

	    Each member's value is the plain string that travels through the
	    agent as the ``"intent"`` of a parsed query.
	    """

	    # File-oriented intents.
	    FILE_READ = "file_read"
	    FILE_WRITE = "file_write"
	    FILE_EDIT = "file_edit"
	    FILE_SEARCH = "file_search"
	    # Tooling intents.
	    GIT_OPERATION = "git_operation"
	    CODE_EXECUTION = "code_execution"
	    WEB_SEARCH = "web_search"
	    # Agent-state intents.
	    MEMORY = "memory"
	    TASK = "task"
	    # Conversational intents; GENERAL is the fallback when nothing matches.
	    QUESTION = "question"
	    GENERAL = "general"


	@dataclass
	class ToolCall:
	    """Record of a single tool invocation and its outcome."""

	    # Name the tool was looked up under.
	    tool_name: str
	    # Keyword arguments the tool was called with.
	    arguments: Dict[str, Any]
	    # Value returned by the tool; stays None when the call raised.
	    result: Optional[Dict[str, Any]] = None
	    # True when the call is considered successful.
	    success: bool = False
	    # Stringified exception when the call raised, otherwise None.
	    error: Optional[str] = None


	@dataclass
	class AgentResponse:
	    """Final answer produced by the agent for one query."""

	    # Human-readable response text.
	    content: str
	    # Tool invocations performed while answering (empty by default).
	    tool_calls: List[ToolCall] = field(default_factory=list)
	    # Context identifiers used for the answer (empty by default).
	    context_used: List[str] = field(default_factory=list)
	    # Confidence score attached to the answer; defaults to 1.0.
	    confidence: float = 1.0
	    # Whether the caller should ask the user for more information.
	    needs_clarification: bool = False
	    # Optional text describing what needs clarifying.
	    clarification_needed: Optional[str] = None


	class QueryUnderstanding:
	    """Map free-form user queries to a ``QueryIntent`` via regex patterns."""

	    # Capture group for a file argument. Each extension ends with ``\b`` so
	    # that ``.js`` cannot match the first three characters of ``.json``.
	    _FILE_ARG = r"(.+\.py\b|.+\.js\b|.+\.txt\b|.+\.md\b|.+\.json\b)"

	    # Intent patterns. Intents are tried in dict order and the first pattern
	    # that matches wins, so the narrowly-phrased intents (web search, memory,
	    # tasks) come before the broad file patterns ("find ...", "save ...",
	    # "create ...") that would otherwise shadow them.
	    PATTERNS = {
	        QueryIntent.WEB_SEARCH: [
	            r"search\s+(?:the\s+)?web\s+for\s+(.+)",
	            r"google\s+(.+)",
	            r"look\s+up\s+(.+)",
	            r"find\s+information\s+about\s+(.+)",
	        ],
	        QueryIntent.MEMORY: [
	            r"(remember|recall|what do you remember)\s+(.+)",
	            r"(save|store)\s+(?:to\s+)?memory\s+(.+)",
	            r"what('s| is)\s+in\s+(?:the\s+)?memory",
	        ],
	        QueryIntent.TASK: [
	            r"(create|add|new)\s+task\s+(.+)",
	            r"list\s+(?:my\s+)?tasks?",
	            r"(complete|finish|done)\s+task\s+(.+)",
	        ],
	        QueryIntent.FILE_READ: [
	            r"read\s+(?:the\s+)?(?:file\s+)?" + _FILE_ARG,
	            r"show\s+(?:me\s+)?(?:the\s+)?(?:content\s+of\s+)?" + _FILE_ARG,
	            r"what('s| is)\s+in\s+" + _FILE_ARG,
	            r"cat\s+(.+)",
	            r"view\s+(.+)",
	        ],
	        QueryIntent.FILE_WRITE: [
	            r"write\s+(?:to\s+)?" + _FILE_ARG,
	            r"create\s+(?:file\s+)?" + _FILE_ARG,
	            r"save\s+(?:to\s+)?(.+)",
	        ],
	        QueryIntent.FILE_EDIT: [
	            r"edit\s+" + _FILE_ARG,
	            r"modify\s+(.+)",
	            r"change\s+(.+)",
	            r"replace\s+(.+)",
	        ],
	        QueryIntent.FILE_SEARCH: [
	            r"find\s+(?:files?\s+)?(?:named\s+)?(.+)",
	            r"search\s+for\s+(?:files?\s+)?(.+)",
	            r"where\s+is\s+(.+)",
	            r"locate\s+(.+)",
	        ],
	        QueryIntent.GIT_OPERATION: [
	            r"git\s+(commit|push|pull|branch|status|log|diff)",
	            r"(commit|push|pull|branch)\s+(?:to\s+)?(?:the\s+)?(?:repo|repository)?",
	        ],
	        QueryIntent.CODE_EXECUTION: [
	            r"run\s+(?:the\s+)?(?:command\s+)?(.+)",
	            r"execute\s+(.+)",
	            r"start\s+(?:the\s+)?(?:server\s+)?(.+)",
	            r"test\s+(?:the\s+)?(.+)",
	            r"lint\s+(.+)",
	            r"format\s+(.+)",
	        ],
	        QueryIntent.QUESTION: [
	            r"what\s+is\s+(.+)",
	            r"how\s+(?:do|does)\s+(.+)",
	            r"why\s+(.+)",
	            r"can\s+(.+)",
	            r"(?:help|explain)\s+(.+)",
	        ],
	    }

	    # Extensions probed by extract_file_path, in priority order.
	    _FILE_EXTENSIONS = ("py", "js", "ts", "md", "json", "txt", "yaml", "yml")

	    def __init__(self):
	        self.tools = list_tools()

	    def parse(self, query: str) -> Dict[str, Any]:
	        """Parse query and determine intent.

	        Args:
	            query: Raw user text.

	        Returns:
	            A dict with keys ``"intent"`` (a ``QueryIntent`` value string),
	            ``"matched"`` (the matched substring or None), ``"extracted"``
	            (tuple of regex groups, or None when the pattern has no groups)
	            and ``"confidence"`` (0.8 for a pattern hit, 0.5 for the
	            ``general`` fallback).
	        """
	        # Matching is case-insensitive via re.IGNORECASE, so the query is not
	        # lowercased: doing so would corrupt case-sensitive file paths in
	        # the "matched"/"extracted" values.
	        query = query.strip()

	        for intent, patterns in self.PATTERNS.items():
	            for pattern in patterns:
	                match = re.search(pattern, query, re.IGNORECASE)
	                if match:
	                    groups = match.groups()
	                    return {
	                        "intent": intent.value,
	                        "matched": match.group(0),
	                        "extracted": groups if groups else None,
	                        "confidence": 0.8,
	                    }

	        return {
	            "intent": QueryIntent.GENERAL.value,
	            "matched": None,
	            "extracted": None,
	            "confidence": 0.5,
	        }

	    def extract_file_path(self, text: str) -> Optional[str]:
	        """Extract file path from text.

	        Known extensions are probed in priority order; if none is found the
	        first run of path-like characters is returned instead.

	        Args:
	            text: Text that may mention a file path.

	        Returns:
	            The extracted path, or None when ``text`` contains no path-like
	            characters at all.
	        """
	        for ext in self._FILE_EXTENSIONS:
	            # The negative lookahead stops ".js" from matching inside
	            # ".json" (and similar longer extensions).
	            match = re.search(
	                rf"([a-zA-Z0-9_/\-.]+\.{ext})(?![a-zA-Z0-9_])", text
	            )
	            if match:
	                return match.group(1)

	        # Fallback: any run of path-like characters.
	        match = re.search(r"([a-zA-Z0-9_/\-.]+)", text)
	        return match.group(1) if match else None


	class ToolSelector:
	    """Selects appropriate tools based on query intent."""

	    # Intent to tool mapping
	    INTENT_TOOLS = {
	        QueryIntent.FILE_READ: ["read"],
	        QueryIntent.FILE_WRITE: ["write"],
	        QueryIntent.FILE_EDIT: ["edit"],
	        QueryIntent.FILE_SEARCH: ["search", "grep"],
	        QueryIntent.GIT_OPERATION: ["git_status", "git_commit", "git_push", "git_pull", "git_branch", "git_log"],
	        QueryIntent.CODE_EXECUTION: ["run", "test", "lint", "format"],
	        QueryIntent.WEB_SEARCH: ["web_search", "fetch"],
	        QueryIntent.MEMORY: ["memory_recall", "memory_save", "memory_list"],
	        QueryIntent.TASK: ["create_task", "list_tasks", "update_task"],
	    }

	    # Tools offered for every intent, appended after the intent-specific ones.
	    _GENERAL_TOOLS = ("run", "context_load", "project_scan")

	    def select(self, intent: str, context: Dict[str, Any]) -> List[str]:
	        """Select tools for given intent.

	        Args:
	            intent: A ``QueryIntent`` value string; unknown values yield only
	                the general tools.
	            context: Accepted for interface compatibility; not used here.

	        Returns:
	            A new list of unique tool names: intent-specific tools first,
	            then the general tools.
	        """
	        try:
	            intent_tools = self.INTENT_TOOLS.get(QueryIntent(intent), [])
	        except ValueError:
	            intent_tools = []

	        # Build a fresh list instead of extending the shared INTENT_TOOLS
	        # entry, and de-duplicate with dict.fromkeys so the order is stable
	        # (a set would reorder the tools from run to run).
	        return list(dict.fromkeys([*intent_tools, *self._GENERAL_TOOLS]))

	    def get_tool_parameters(self, tool_name: str, query: str, context: Dict[str, Any]) -> Dict[str, Any]:
	        """Extract parameters for a tool from query and context.

	        Args:
	            tool_name: Tool to build arguments for. Only ``read``, ``write``,
	                ``git_commit`` and ``web_search`` are recognized.
	            query: Raw user text the arguments are pulled from.
	            context: Accepted for interface compatibility; not used here.

	        Returns:
	            Keyword arguments for the tool; empty when the tool is not
	            recognized or nothing could be extracted.
	        """
	        params: Dict[str, Any] = {}

	        if tool_name == "read":
	            path = re.search(r"(?:read|show|cat|view)\s+(?:the\s+)?(?:file\s+)?(.+)", query, re.IGNORECASE)
	            if path:
	                params["path"] = path.group(1).strip()

	        elif tool_name == "write":
	            path = re.search(r"write\s+(?:to\s+)?(.+?)(?:\s+with|\s+content|$)", query, re.IGNORECASE)
	            if path:
	                params["path"] = path.group(1).strip()
	            # Try to extract content
	            content_match = re.search(r"(?:content|with):\s*(.+)$", query, re.IGNORECASE)
	            if content_match:
	                params["content"] = content_match.group(1)

	        elif tool_name == "git_commit":
	            msg = re.search(r"commit(?:\s+with)?\s+(?:message\s+)?(.+)", query, re.IGNORECASE)
	            if msg:
	                message = msg.group(1).strip()
	                # Drop one pair of matching surrounding quotes; quotes that
	                # belong to the message itself are left alone.
	                if len(message) >= 2 and message[0] == message[-1] and message[0] in "\"'":
	                    message = message[1:-1]
	                params["message"] = message

	        elif tool_name == "web_search":
	            # Extract search query
	            patterns = [
	                r"search\s+(?:the\s+)?web\s+for\s+(.+)",
	                r"google\s+(.+)",
	                r"look\s+up\s+(.+)",
	            ]
	            for pattern in patterns:
	                match = re.search(pattern, query, re.IGNORECASE)
	                if match:
	                    params["query"] = match.group(1).strip()
	                    break

	        return params


	class ResponseGenerator:
	    """Generates natural language responses."""

	    def __init__(self):
	        self.context_manager = create_context_manager()

	    def generate(
	        self,
	        tool_results: List[ToolCall],
	        intent: str,
	        context: Dict[str, Any]
	    ) -> str:
	        """Generate response from tool results.

	        Args:
	            tool_results: Tool calls to summarize, in display order.
	            intent: Accepted for interface compatibility; not used here.
	            context: Accepted for interface compatibility; not used here.

	        Returns:
	            One paragraph per reportable tool call joined by blank lines, or
	            a fixed fallback sentence when there is nothing to report.
	        """
	        if not tool_results:
	            return "I couldn't find any results for your query."

	        responses: List[str] = []

	        for call in tool_results:
	            result = call.result

	            if result is None:
	                if call.error:
	                    # The tool raised: surface the recorded error instead of
	                    # reporting a generic "no result".
	                    responses.append(f"Error in {call.tool_name}: {call.error}")
	                else:
	                    responses.append(f"I tried to use {call.tool_name} but got no result.")
	                continue

	            if not isinstance(result, dict):
	                # A tool may return a plain value instead of a dict; show a
	                # short preview rather than failing on ``.get``.
	                responses.append(f"{call.tool_name}: {str(result)[:200]}")
	                continue

	            if result.get("success"):
	                responses.extend(self._format_success(call.tool_name, result))
	            else:
	                error = result.get("error", "Unknown error")
	                responses.append(f"Error in {call.tool_name}: {error}")

	        return "\n\n".join(responses) or "I processed your request but have no results to show."

	    def _format_success(self, tool_name: str, result: Dict[str, Any]) -> List[str]:
	        """Return the response paragraphs for one successful tool result."""
	        if tool_name == "read":
	            if "content" not in result:
	                return []
	            content = result["content"]
	            if len(content) > 500:
	                content = content[:500] + "..."
	            return [f"Here's the content:\n```\n{content}\n```"]

	        if tool_name == "grep":
	            if "matches" not in result:
	                return []
	            matches = result["matches"]
	            if not matches:
	                return ["No matches found."]
	            # Only the first 10 matches are listed.
	            lines = "".join(
	                f"- {m.get('file', '?')}:{m.get('line', '?')} - {m.get('content', '')}\n"
	                for m in matches[:10]
	            )
	            return [f"Found {len(matches)} matches:\n" + lines]

	        if tool_name in ("git_status", "git_log"):
	            if "files" in result:
	                files = result["files"]
	                if files:
	                    return [f"Changed files ({len(files)}):\n" + "\n".join(f" - {f}" for f in files)]
	                return ["No changes detected."]
	            if "commits" in result:
	                commits = result["commits"]
	                if commits:
	                    # Only the 5 first commits are listed.
	                    return ["Recent commits:\n" + "\n".join(f" - {c}" for c in commits[:5])]
	            return []

	        if tool_name == "web_search":
	            if "results" not in result:
	                return []
	            # Only the first 5 hits are listed, by title.
	            titles = "".join(
	                f"- {r.get('title', 'Untitled')}\n" for r in result["results"][:5]
	            )
	            return ["Search results:\n" + titles]

	        if tool_name == "run":
	            stdout = result.get("stdout", "")
	            stderr = result.get("stderr", "")
	            parts = []
	            if stdout:
	                parts.append(f"Output:\n```\n{stdout[:500]}\n```")
	            if stderr:
	                parts.append(f"Errors:\n```\n{stderr[:500]}\n```")
	            if not stdout and not stderr:
	                parts.append("Command executed successfully.")
	            return parts

	        if tool_name == "memory_recall":
	            if "matches" not in result:
	                return []
	            matches = result["matches"]
	            if matches:
	                return [f"Found {len(matches)} memory entries."]
	            return ["No matching memories found."]

	        # Generic success response. default=str keeps this display-only
	        # preview from raising on values json cannot serialize.
	        return [f"{tool_name}: {json.dumps(result, default=str)[:200]}"]

	    def generate_clarification(self, question: str) -> str:
	        """Generate clarification question."""
	        return f"I need some clarification: {question}"


	class SelfReflection:
	    """Self-reflection loop for improving responses."""

	    def __init__(self):
	        self.max_iterations = 3
	        # Confidence below this value flags the response for reflection.
	        self.min_confidence = 0.7

	    def reflect(
	        self,
	        query: str,
	        tool_calls: List[ToolCall],
	        response: str
	    ) -> Dict[str, Any]:
	        """Reflect on the response and determine if improvement is needed.

	        Args:
	            query: Original user query; not used by the current heuristics.
	            tool_calls: Tool calls executed for the query.
	            response: Response text generated from those calls.

	        Returns:
	            A dict with ``"needs_reflection"``, ``"confidence"`` (fraction of
	            successful tool calls, 0.0 when there were none),
	            ``"failed_calls"`` (count), ``"response_length"`` and
	            ``"suggestion"`` (None unless reflection is needed).
	        """
	        # Check if any tool call failed
	        failed_calls = [c for c in tool_calls if not c.success]

	        # Confidence is the share of calls that succeeded. max(..., 1)
	        # avoids dividing by zero when no tool was called.
	        succeeded = len(tool_calls) - len(failed_calls)
	        confidence = succeeded / max(len(tool_calls), 1)

	        needs_reflection = (
	            len(failed_calls) > 0 or
	            confidence < self.min_confidence or
	            len(response) < 20  # very short responses are treated as suspect
	        )

	        return {
	            "needs_reflection": needs_reflection,
	            "confidence": confidence,
	            "failed_calls": len(failed_calls),
	            "response_length": len(response),
	            "suggestion": self._get_suggestion(failed_calls, confidence) if needs_reflection else None
	        }

	    def _get_suggestion(self, failed_calls: List[ToolCall], confidence: float) -> str:
	        """Get improvement suggestion."""
	        if not failed_calls:
	            return "Try providing more context in your query."

	        return f"Failed tool calls: {', '.join(c.tool_name for c in failed_calls)}"


	class StackAgent:
	    """
	    Core agent that combines all components for intelligent assistance.

	    A query flows through: intent parsing, tool selection, tool execution,
	    response generation and self-reflection.
	    """

	    def __init__(self, workspace: Optional[str] = None):
	        self.query_understanding = QueryUnderstanding()
	        self.tool_selector = ToolSelector()
	        self.response_generator = ResponseGenerator()
	        self.self_reflection = SelfReflection()
	        self.context_manager = create_context_manager(workspace)
	        # One entry per processed query, appended by process().
	        self.conversation_history: List[Dict[str, Any]] = []

	    def _execute_tool(self, tool_name: str, params: Dict[str, Any]) -> Optional[ToolCall]:
	        """Run one tool and wrap the outcome in a ToolCall.

	        Returns None when ``get_tool`` does not know ``tool_name``. Any
	        exception raised by the tool is captured in ``ToolCall.error``
	        rather than propagated.
	        """
	        tool = get_tool(tool_name)
	        if tool is None:
	            return None

	        try:
	            result = tool(**params)
	        except Exception as e:
	            return ToolCall(
	                tool_name=tool_name,
	                arguments=params,
	                error=str(e),
	                success=False
	            )

	        # Dict results carry their own "success" flag; any other return
	        # value counts as success.
	        return ToolCall(
	            tool_name=tool_name,
	            arguments=params,
	            result=result,
	            success=result.get("success", False) if isinstance(result, dict) else True
	        )

	    def process(self, query: str, context: Optional[Dict] = None) -> AgentResponse:
	        """Process a user query.

	        Args:
	            query: Raw user text.
	            context: Optional extra context passed to tool selection and
	                response generation; defaults to an empty dict.

	        Returns:
	            The generated response, the executed tool calls, and the
	            reflection's confidence and suggestion.
	        """
	        context = context or {}

	        # Step 1: Understand query
	        parsed = self.query_understanding.parse(query)
	        intent = parsed["intent"]
	        confidence = parsed["confidence"]

	        # Step 2: Select tools
	        selected_tools = self.tool_selector.select(intent, context)

	        # Step 3: Execute tools (unknown tools are skipped)
	        tool_calls = []
	        for tool_name in selected_tools:
	            params = self.tool_selector.get_tool_parameters(tool_name, query, context)
	            call = self._execute_tool(tool_name, params)
	            if call is None:
	                continue

	            tool_calls.append(call)

	            # Record in session
	            self.context_manager.session.add_tool_usage(tool_name, call.result)

	        # Step 4: Generate response
	        response_content = self.response_generator.generate(tool_calls, intent, context)

	        # Step 5: Self-reflect
	        reflection = self.self_reflection.reflect(query, tool_calls, response_content)

	        # Step 6: Add to conversation history
	        self.conversation_history.append({
	            "query": query,
	            "intent": intent,
	            "tool_calls": [c.tool_name for c in tool_calls],
	            "response": response_content,
	            "reflection": reflection,
	            "timestamp": datetime.now().isoformat()
	        })

	        return AgentResponse(
	            content=response_content,
	            tool_calls=tool_calls,
	            # Parse confidence is only a fallback for a missing reflection score.
	            confidence=reflection.get("confidence", confidence),
	            needs_clarification=reflection.get("needs_reflection", False),
	            clarification_needed=reflection.get("suggestion")
	        )

	    def process_with_tools(self, query: str, forced_tools: List[str]) -> AgentResponse:
	        """Process query with explicitly specified tools.

	        Each tool is called without arguments; ``query`` is not used to
	        derive parameters. Unknown tools are skipped, and nothing is added
	        to the session or the conversation history.
	        """
	        tool_calls = []

	        for tool_name in forced_tools:
	            call = self._execute_tool(tool_name, {})
	            if call is not None:
	                tool_calls.append(call)

	        response_content = self.response_generator.generate(tool_calls, "general", {})

	        return AgentResponse(
	            content=response_content,
	            tool_calls=tool_calls,
	            confidence=1.0
	        )

	    def get_context(self) -> str:
	        """Get current context as string."""
	        return self.context_manager.get_workspace_context()

	    def get_schemas(self) -> List[Dict[str, Any]]:
	        """Get tool schemas for tool calling."""
	        return get_tool_schemas()


	def create_agent(workspace: Optional[str] = None) -> StackAgent:
	    """Factory function to create agent.

	    Args:
	        workspace: Optional workspace forwarded unchanged to ``StackAgent``.

	    Returns:
	        A newly constructed ``StackAgent``.
	    """
	    return StackAgent(workspace)


	if __name__ == "__main__":
	    # Manual smoke test: build an agent and run one sample query.
	    # NOTE(review): this file uses relative imports, so it presumably has
	    # to be started as a module of its package (python -m ...) - confirm.
	    print("Stack 2.9 Agent Module")
	    agent = create_agent()
	    print(f"Agent initialized with {len(list_tools())} tools")

	    # Test query
	    query = "list my tasks"
	    response = agent.process(query)
	    print(f"\nQuery: '{query}'")
	    print(f"Response: {response.content[:200]}")