Instructions to use my-ai-stack/Stack-2-9-finetuned with libraries, inference providers, notebooks, and local apps. Follow these links to get started.

Libraries

How to use my-ai-stack/Stack-2-9-finetuned with Transformers:

# Use a pipeline as a high-level helper
from transformers import pipeline

# Build a "text-generation" pipeline for this model repo id.
pipe = pipeline("text-generation", model="my-ai-stack/Stack-2-9-finetuned")
# Chat-style input: a list of {"role", "content"} message dicts.
messages = [
    {"role": "user", "content": "Who are you?"},
]
# Run the pipeline on the conversation; the result is neither stored nor
# printed here, so it is only visible in an interactive session.
pipe(messages)

# Load model directly
from transformers import AutoTokenizer, AutoModelForCausalLM

# Tokenizer and model are loaded from the same repo id.
tokenizer = AutoTokenizer.from_pretrained("my-ai-stack/Stack-2-9-finetuned")
model = AutoModelForCausalLM.from_pretrained("my-ai-stack/Stack-2-9-finetuned")
messages = [
    {"role": "user", "content": "Who are you?"},
]
# Apply the tokenizer's chat template and tokenize in one call, then move the
# resulting inputs to the device the model lives on.
inputs = tokenizer.apply_chat_template(
	messages,
	add_generation_prompt=True,
	tokenize=True,
	return_dict=True,
	return_tensors="pt",
).to(model.device)

# Generate at most 40 new tokens.
outputs = model.generate(**inputs, max_new_tokens=40)
# Slice off the first len(input_ids) positions of the first output sequence so
# that only the tokens after the prompt are decoded and printed.
print(tokenizer.decode(outputs[0][inputs["input_ids"].shape[-1]:]))

Notebooks
Google Colab
Kaggle
Local Apps

vLLM

How to use my-ai-stack/Stack-2-9-finetuned with vLLM:

Install from pip and serve model

# Install vLLM from pip:
pip install vllm
# Start the vLLM server:
vllm serve "my-ai-stack/Stack-2-9-finetuned"
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:8000/v1/chat/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "my-ai-stack/Stack-2-9-finetuned",
		"messages": [
			{
				"role": "user",
				"content": "What is the capital of France?"
			}
		]
	}'

Use Docker

docker model run hf.co/my-ai-stack/Stack-2-9-finetuned

SGLang

How to use my-ai-stack/Stack-2-9-finetuned with SGLang:

Install from pip and serve model

# Install SGLang from pip:
pip install sglang
# Start the SGLang server:
python3 -m sglang.launch_server \
    --model-path "my-ai-stack/Stack-2-9-finetuned" \
    --host 0.0.0.0 \
    --port 30000
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/chat/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "my-ai-stack/Stack-2-9-finetuned",
		"messages": [
			{
				"role": "user",
				"content": "What is the capital of France?"
			}
		]
	}'

Use Docker images

docker run --gpus all \
    --shm-size 32g \
    -p 30000:30000 \
    -v ~/.cache/huggingface:/root/.cache/huggingface \
    --env "HF_TOKEN=<secret>" \
    --ipc=host \
    lmsysorg/sglang:latest \
    python3 -m sglang.launch_server \
        --model-path "my-ai-stack/Stack-2-9-finetuned" \
        --host 0.0.0.0 \
        --port 30000
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/chat/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "my-ai-stack/Stack-2-9-finetuned",
		"messages": [
			{
				"role": "user",
				"content": "What is the capital of France?"
			}
		]
	}'

Docker Model Runner
How to use my-ai-stack/Stack-2-9-finetuned with Docker Model Runner:
```
docker model run hf.co/my-ai-stack/Stack-2-9-finetuned
```

Stack-2-9-finetuned / scripts / augment_training_data.py

walidsobhie-code

feat: add production infrastructure - CI/CD, Docker, code quality, and monitoring

b5998ff about 2 months ago

raw

history blame

11.8 kB

	#!/usr/bin/env python3
	"""
	Data augmentation script for tool_examples.jsonl.
	Generates 2x-5x more training examples from existing data through:
	- Paraphrasing user prompts
	- Difficulty scaling (simpler/complex variations)
	- Edge case generation
	"""

	import json
	import random
	import argparse
	from pathlib import Path
	from typing import List, Dict, Any, Optional
	from itertools import product
	import copy

	# Random seed for reproducibility.
	# This seeds the global `random` generator as soon as the module is loaded;
	# main() seeds it again from the --seed argument.
	random.seed(42)

	# Paraphrase templates: each key is a phrase to look for in a user prompt,
	# each value lists the candidate phrases paraphrase_text() picks from.
	PARAPHRASES = {
	    "Can you": ["Please", "Would you kindly", "Could you", "Kindly"],
	    "I need": ["I'd like", "I require", "I want", "I must have"],
	    "show me": ["display", "show", "reveal", "let me see"],
	    "the file": ["this file", "that file", "a file"],
	    # NOTE(review): "run" lists itself as an alternative, so that pick
	    # leaves the prompt unchanged.
	    "run": ["execute", "launch", "start", "run"],
	    "create": ["make", "generate", "add", "write"],
	    "delete": ["remove", "erase", "drop", "destroy"],
	    "list": ["show", "display", "enumerate", "get"],
	    "search": ["find", "look for", "grep", "locate"],
	    "help me": ["assist me", "I need help", "please assist", "support"],
	}

	# Difficulty modifiers.
	# NOTE(review): apply_difficulty() selects EASY_MODIFIERS for level "easy"
	# but never draws a value from it; only COMPLEX_MODIFIERS is appended to
	# prompts.
	EASY_MODIFIERS = [
	    "quickly",
	    "simply",
	    "just",
	    "easily",
	]

	COMPLEX_MODIFIERS = [
	    "carefully",
	    "thoroughly",
	    "in detail",
	    "completely",
	    "with all options",
	]

	# Edge case patterns: (label, generator) pairs sampled by
	# generate_edge_cases(). The lambdas defer the name lookup until call time,
	# which is required because the _create_* helpers are defined further down
	# in the module.
	EDGE_CASE_PATTERNS = [
	    ("empty_input", lambda ex: _create_empty_variant(ex)),
	    ("multi_step", lambda ex: _create_multistep_variant(ex)),
	    ("error_handling", lambda ex: _create_error_variant(ex)),
	]


	def _deep_copy(obj: Any) -> Any:
	"""Create a deep copy of a JSON-serializable object."""
	return json.loads(json.dumps(obj))


	def _create_empty_variant(example: Dict[str, Any]) -> Optional[Dict[str, Any]]:
	    """Create an edge-case variant whose first user message is blank.

	    Args:
	        example: Training example holding a "messages" list of message dicts.

	    Returns:
	        A copy of ``example`` in which the first user message's content is a
	        single space and "source" is "augmented_edge_empty", or ``None`` when
	        the example has no user message (previously an unchanged copy was
	        returned under the edge-case label).

	    Raises:
	        KeyError: If ``example`` has no "messages" key.
	    """
	    new_ex = _deep_copy(example)
	    # Every other message (system, assistant, tool) is kept as-is.
	    # NOTE(review): any assistant tool calls that follow are kept too, so the
	    # variant pairs a blank prompt with the original response - confirm this
	    # is the intended training signal.
	    for msg in new_ex["messages"]:
	        if msg.get("role") == "user":
	            msg["content"] = " "
	            new_ex["source"] = "augmented_edge_empty"
	            return new_ex
	    # Nothing was blanked, so there is no variant to report.
	    return None


	def _create_multistep_variant(example: Dict[str, Any]) -> Optional[Dict[str, Any]]:
	    """Create a variant with a reasoning message ahead of the first tool call.

	    Args:
	        example: Training example holding a "messages" list of message dicts.

	    Returns:
	        A copy of ``example`` with an assistant "reasoning" message inserted
	        directly before the first message that has non-empty "tool_calls",
	        labelled "augmented_edge_multistep"; ``None`` when no message carries
	        tool calls (previously an unchanged copy was returned under the
	        edge-case label).

	    Raises:
	        KeyError: If ``example`` has no "messages" key.
	    """
	    new_ex = _deep_copy(example)
	    messages = new_ex["messages"]
	    for i, msg in enumerate(messages):
	        if msg.get("tool_calls"):
	            # NOTE(review): if the tool-call message is itself an assistant
	            # turn, this produces two consecutive assistant messages -
	            # confirm the chat template used for training accepts that.
	            reasoning = {
	                "role": "assistant",
	                "content": "Let me think about this step by step. First, I need to understand what the user is asking for."
	            }
	            # Returning right after the insert avoids iterating a list that
	            # was just mutated.
	            messages.insert(i, reasoning)
	            new_ex["source"] = "augmented_edge_multistep"
	            return new_ex
	    # No tool call found: nothing to prepend a reasoning step to.
	    return None


	def _create_error_variant(example: Dict[str, Any]) -> Optional[Dict[str, Any]]:
	    """Create a variant in which the first tool result reports a failure.

	    Only the first message with role "tool" is considered:

	    * content containing "Successfully" has that word replaced by
	      "Error occurred:";
	    * content that does not mention "error" (case-insensitive), or that is
	      missing / not a string, is replaced by
	      "Operation failed: Permission denied";
	    * content that already mentions an error is left alone and no variant is
	      produced.

	    Args:
	        example: Training example holding a "messages" list of message dicts.

	    Returns:
	        The modified copy labelled "augmented_edge_error", or ``None`` when
	        there is no tool message or it already reports an error (previously
	        an unchanged copy was returned under the edge-case label).

	    Raises:
	        KeyError: If ``example`` has no "messages" key.
	    """
	    new_ex = _deep_copy(example)
	    for msg in new_ex["messages"]:
	        if msg.get("role") != "tool":
	            continue

	        content = msg.get("content")
	        if not isinstance(content, str):
	            # Null or structured content used to raise a TypeError /
	            # AttributeError here; treat it as "no success text".
	            content = ""

	        if "Successfully" in content:
	            msg["content"] = content.replace("Successfully", "Error occurred:")
	        elif "error" not in content.lower():
	            msg["content"] = "Operation failed: Permission denied"
	        else:
	            # Already an error result: the variant would be a duplicate.
	            return None

	        # NOTE(review): messages after the tool result are not adjusted, so
	        # a following assistant reply may still describe a success.
	        new_ex["source"] = "augmented_edge_error"
	        return new_ex

	    # No tool result to turn into an error.
	    return None


	def paraphrase_text(text: str) -> str:
	    """Replace the first known phrase in ``text`` with a random alternative.

	    PARAPHRASES is scanned in insertion order. The first key that occurs in
	    ``text`` as a whole phrase (case-insensitive, not embedded in a longer
	    word) is replaced once by a randomly chosen alternative; later keys are
	    not applied.

	    Args:
	        text: Prompt text to paraphrase.

	    Returns:
	        The paraphrased text, or ``text`` unchanged when it is empty or no
	        key matches.
	    """
	    # Function-scope import keeps this block self-contained; the module's
	    # import list does not include `re`.
	    import re

	    if not text:
	        return text

	    for original, alternatives in PARAPHRASES.items():
	        # Word-bounded match: plain substring search used to rewrite pieces
	        # of longer words ("running" -> "executening"). Searching the
	        # original string also avoids index drift from str.lower() changing
	        # the length of some Unicode text.
	        match = re.search(
	            rf"(?<!\w){re.escape(original)}(?!\w)", text, flags=re.IGNORECASE
	        )
	        if match is None:
	            continue

	        matched = match.group(0)
	        # Skip alternatives equal to the matched phrase (e.g. "run" -> "run")
	        # so a match always changes the text; fall back to the full list if
	        # that would leave nothing to choose from.
	        candidates = [
	            alt for alt in alternatives if alt.lower() != matched.lower()
	        ] or alternatives
	        replacement = random.choice(candidates)

	        # Carry over a leading capital from the matched phrase. Only the
	        # first character is touched so the rest of the replacement keeps
	        # its own casing.
	        if matched[0].isupper():
	            replacement = replacement[0].upper() + replacement[1:]

	        return text[:match.start()] + replacement + text[match.end():]

	    return text


	def apply_difficulty(example: Dict[str, Any], level: str) -> Dict[str, Any]:
	    """Return a copy of ``example`` with its first user prompt rescaled.

	    Args:
	        example: Training example holding a "messages" list of message dicts.
	        level: "easy" strips the politeness words "please" / "kindly" from
	            the prompt; "complex" appends a random entry of
	            COMPLEX_MODIFIERS. Any other value leaves the prompt untouched.

	    Returns:
	        The modified copy with "source" set to
	        ``"augmented_difficulty_<level>"``. Only the first user message with
	        non-empty string content is changed.

	    Raises:
	        KeyError: If ``example`` has no "messages" key.
	    """
	    # Function-scope import keeps this block self-contained; the module's
	    # import list does not include `re`.
	    import re

	    new_ex = _deep_copy(example)

	    for msg in new_ex["messages"]:
	        content = msg.get("content")
	        if msg.get("role") != "user" or not isinstance(content, str) or not content:
	            continue

	        if level == "easy":
	            # Whole-word, case-insensitive removal. The optional commas and
	            # the preceding blanks are consumed with the word so that
	            # "Can you please show" -> "Can you show" and
	            # "Show it, please." -> "Show it." (plain str.replace missed
	            # "Please", mangled "pleased", and left doubled spaces).
	            simplified = re.sub(
	                r",?[ \t]*\b(?:please|kindly)\b,?",
	                "",
	                content,
	                flags=re.IGNORECASE,
	            ).strip()
	            # Never blank the prompt entirely (e.g. content == "please").
	            content = simplified or content
	        elif level == "complex":
	            # EASY_MODIFIERS is intentionally not consulted: the easy branch
	            # only removes words, it never appends a modifier.
	            content = f"{content} {random.choice(COMPLEX_MODIFIERS)}"

	        msg["content"] = content
	        break

	    new_ex["source"] = f"augmented_difficulty_{level}"
	    return new_ex


	def _parse_tool_arguments(raw: Any) -> Optional[Dict[str, Any]]:
	    """Return tool-call arguments as a dict, or None if they cannot be read."""
	    if isinstance(raw, str):
	        try:
	            raw = json.loads(raw)
	        except json.JSONDecodeError:
	            return None
	    return raw if isinstance(raw, dict) else None


	def vary_tool_parameters(example: Dict[str, Any]) -> List[Dict[str, Any]]:
	    """Generate variations of ``example`` with different tool-call arguments.

	    For every tool call whose arguments contain one of the known parameter
	    names ("file_path", "command", "pattern", "path"), one variation is
	    produced per such parameter: the first listed alternative that differs
	    from the current value is written into every tool call of the copy that
	    has that parameter.

	    NOTE(review): the original indentation of this function was lost, so the
	    position of its trailing ``break`` is ambiguous. It is read here as
	    "stop after the first differing alternative", i.e. one variation per
	    parameter per tool call - confirm against the upstream file.

	    Args:
	        example: Training example; tool calls are read from
	            ``message["tool_calls"][i]["function"]["arguments"]``, which may
	            be a JSON string or an already-decoded dict.

	    Returns:
	        A list of modified copies, each labelled "augmented_params". Empty
	        when no tool call has a known parameter.
	    """
	    # Common parameter variations (loop-invariant, so built once).
	    param_variations = [
	        ("file_path", ["src/main.py", "README.md", "config.yaml", "package.json", "tests/test.py"]),
	        ("command", ["ls -la", "echo hello", "pwd", "whoami"]),
	        ("pattern", [".py", ".js", ".md", ".json"]),
	        ("path", ["src", "lib", "docs", "."]),
	    ]

	    variations = []

	    for msg in example.get("messages", []):
	        for tc in msg.get("tool_calls") or []:
	            func = tc.get("function") or {}
	            args = _parse_tool_arguments(func.get("arguments", "{}"))
	            if args is None:
	                # Unparsable or non-dict arguments: nothing to vary.
	                continue

	            for param_name, alternatives in param_variations:
	                if param_name not in args:
	                    continue
	                original_val = args[param_name]
	                alt_val = next(
	                    (alt for alt in alternatives if alt != original_val), None
	                )
	                if alt_val is None:
	                    continue

	                new_ex = _deep_copy(example)
	                for new_msg in new_ex["messages"]:
	                    for new_tc in new_msg.get("tool_calls") or []:
	                        new_func = new_tc.get("function") or {}
	                        raw_args = new_func.get("arguments", "{}")
	                        # Same tolerant parsing as above: the previous bare
	                        # json.loads() raised on dict-valued or malformed
	                        # arguments in any sibling tool call.
	                        new_args = _parse_tool_arguments(raw_args)
	                        if new_args is None or param_name not in new_args:
	                            continue
	                        new_args[param_name] = alt_val
	                        # Write back in the representation that was found.
	                        new_func["arguments"] = (
	                            json.dumps(new_args)
	                            if isinstance(raw_args, str)
	                            else new_args
	                        )
	                new_ex["source"] = "augmented_params"
	                variations.append(new_ex)

	    return variations


	def add_filler_variant(example: Dict[str, Any]) -> Optional[Dict[str, Any]]:
	    """Return a copy of ``example`` with a polite filler appended to the prompt.

	    The first user message with non-empty content has its trailing
	    whitespace stripped and one randomly chosen filler phrase appended. The
	    copy is labelled "augmented_filler" whether or not such a message was
	    found.
	    """
	    variant = _deep_copy(example)

	    # First user turn that actually has text, if any.
	    first_user = next(
	        (m for m in variant["messages"] if m["role"] == "user" and m.get("content")),
	        None,
	    )
	    if first_user is not None:
	        suffix = random.choice(
	            [" please", " if you could", " when you get a chance", " thanks"]
	        )
	        first_user["content"] = first_user["content"].rstrip() + suffix

	    variant["source"] = "augmented_filler"
	    return variant


	def generate_edge_cases(example: Dict[str, Any], num_cases: int = 2) -> List[Dict[str, Any]]:
	    """Build up to ``num_cases`` edge-case variants of ``example``.

	    Generators are drawn without replacement from EDGE_CASE_PATTERNS (at
	    most as many as the table holds). This is best effort: a generator that
	    raises, or that returns a falsy value, contributes nothing.
	    """
	    how_many = min(num_cases, len(EDGE_CASE_PATTERNS))
	    produced = []

	    for _label, build in random.sample(EDGE_CASE_PATTERNS, how_many):
	        try:
	            candidate = build(example)
	        except Exception:
	            # Deliberately tolerant: a malformed example only costs this
	            # one variant.
	            continue
	        if candidate:
	            produced.append(candidate)

	    return produced


	def augment_example(example: Dict[str, Any], target_multiplier: int = 3) -> List[Dict[str, Any]]:
	    """Generate augmented variations of a single example.

	    Candidate variants are produced in a fixed order (paraphrase, easy /
	    complex difficulty, filler, tool-parameter changes, one edge case), each
	    gated by a random draw where noted below. Candidates whose messages are
	    identical to the original's are dropped instead of being emitted as
	    relabelled duplicates.

	    Args:
	        example: Training example; expected to hold a "messages" list.
	        target_multiplier: Maximum number of examples returned, counting the
	            original. Values below 1 are treated as 1 so the original is
	            always kept.

	    Returns:
	        A list starting with ``example`` itself, followed by at most
	        ``target_multiplier - 1`` variants. An example without a "messages"
	        list is returned alone, un-augmented.
	    """
	    variations = [example]  # Always keep original

	    messages = example.get("messages") if isinstance(example, dict) else None
	    if not isinstance(messages, list):
	        # Nothing to augment; previously this raised and aborted the run.
	        return variations

	    def keep(variant: Optional[Dict[str, Any]]) -> None:
	        # Only real changes count as augmentation.
	        if variant and variant.get("messages") != messages:
	            variations.append(variant)

	    # 1. Paraphrase variant
	    if random.random() < 0.7:
	        new_ex = _deep_copy(example)
	        for msg in new_ex["messages"]:
	            content = msg.get("content")
	            if msg.get("role") == "user" and isinstance(content, str) and content:
	                msg["content"] = paraphrase_text(content)
	                break
	        new_ex["source"] = "augmented_paraphrase"
	        keep(new_ex)

	    # 2. Difficulty variants (easy and complex)
	    if random.random() < 0.5:
	        keep(apply_difficulty(example, "easy"))
	    if random.random() < 0.5:
	        keep(apply_difficulty(example, "complex"))

	    # 3. Filler variant
	    if random.random() < 0.3:
	        keep(add_filler_variant(example))

	    # 4. Tool parameter variations
	    for param_variant in vary_tool_parameters(example)[:2]:  # Limit to 2
	        keep(param_variant)

	    # 5. Edge cases
	    if random.random() < 0.3:
	        for edge_case in generate_edge_cases(example)[:1]:
	            keep(edge_case)

	    # Limit total variations, but never drop the original itself.
	    return variations[:max(1, target_multiplier)]


	def main():
	    """Command-line entry point: read a JSONL file, augment it, write JSONL.

	    Options: --input, --output, --multiplier (cap on examples kept per input
	    example, original included) and --seed (re-seeds the global ``random``
	    generator). Blank lines are ignored; lines that are not valid JSON are
	    skipped and counted. If the input file does not exist, an error is
	    printed and the function returns without writing anything.
	    """
	    parser = argparse.ArgumentParser(description="Augment training data for Stack 2.9")
	    parser.add_argument("--input", type=str,
	                        default="training-data/tool_examples.jsonl",
	                        help="Input JSONL file")
	    parser.add_argument("--output", type=str,
	                        default="training-data/augmented_tool_examples.jsonl",
	                        help="Output JSONL file")
	    parser.add_argument("--multiplier", type=int, default=3,
	                        help="Target multiplication factor (2-5)")
	    parser.add_argument("--seed", type=int, default=42,
	                        help="Random seed for reproducibility")

	    args = parser.parse_args()
	    random.seed(args.seed)

	    input_path = Path(args.input)
	    output_path = Path(args.output)

	    if not input_path.exists():
	        print(f"Error: Input file not found: {input_path}")
	        return

	    print(f"Loading data from: {input_path}")
	    examples = []
	    skipped = 0
	    with open(input_path, 'r', encoding='utf-8') as f:
	        for line in f:
	            line = line.strip()
	            if not line:
	                continue
	            try:
	                examples.append(json.loads(line))
	            except json.JSONDecodeError:
	                # Keep going, but remember the loss so it can be reported.
	                skipped += 1

	    original_count = len(examples)
	    print(f"Loaded {original_count} examples")
	    if skipped:
	        print(f"Skipped {skipped} malformed line(s)")

	    # Generate augmented examples
	    all_variations = []
	    for ex in examples:
	        all_variations.extend(
	            augment_example(ex, target_multiplier=args.multiplier)
	        )

	    total_count = len(all_variations)

	    # Write output (an empty input still yields an empty output file)
	    output_path.parent.mkdir(parents=True, exist_ok=True)
	    with open(output_path, 'w', encoding='utf-8') as f:
	        for var in all_variations:
	            f.write(json.dumps(var, ensure_ascii=False) + "\n")

	    print("\nAugmentation complete!")
	    print(f" Original: {original_count} examples")
	    print(f" Augmented: {total_count} examples")
	    if original_count:
	        print(f" Multiplier: {total_count/original_count:.1f}x")
	    else:
	        # Avoids the ZeroDivisionError an empty or all-malformed input caused.
	        print(" Multiplier: n/a (no input examples)")
	    print(f" Output: {output_path}")


	if __name__ == "__main__":
	    main()