Instructions to use my-ai-stack/Stack-2-9-finetuned with libraries, inference providers, notebooks, and local apps. Follow these links to get started.

Libraries

How to use my-ai-stack/Stack-2-9-finetuned with Transformers:

# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("text-generation", model="my-ai-stack/Stack-2-9-finetuned")
messages = [
    {"role": "user", "content": "Who are you?"},
]
pipe(messages)

# Load model directly
from transformers import AutoTokenizer, AutoModelForCausalLM

tokenizer = AutoTokenizer.from_pretrained("my-ai-stack/Stack-2-9-finetuned")
model = AutoModelForCausalLM.from_pretrained("my-ai-stack/Stack-2-9-finetuned")
messages = [
    {"role": "user", "content": "Who are you?"},
]
inputs = tokenizer.apply_chat_template(
	messages,
	add_generation_prompt=True,
	tokenize=True,
	return_dict=True,
	return_tensors="pt",
).to(model.device)

outputs = model.generate(**inputs, max_new_tokens=40)
print(tokenizer.decode(outputs[0][inputs["input_ids"].shape[-1]:]))

Notebooks
Google Colab
Kaggle
Local Apps

vLLM

How to use my-ai-stack/Stack-2-9-finetuned with vLLM:

Install from pip and serve model

# Install vLLM from pip:
pip install vllm
# Start the vLLM server:
vllm serve "my-ai-stack/Stack-2-9-finetuned"
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:8000/v1/chat/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "my-ai-stack/Stack-2-9-finetuned",
		"messages": [
			{
				"role": "user",
				"content": "What is the capital of France?"
			}
		]
	}'

Use Docker

docker model run hf.co/my-ai-stack/Stack-2-9-finetuned

SGLang

How to use my-ai-stack/Stack-2-9-finetuned with SGLang:

Install from pip and serve model

# Install SGLang from pip:
pip install sglang
# Start the SGLang server:
python3 -m sglang.launch_server \
    --model-path "my-ai-stack/Stack-2-9-finetuned" \
    --host 0.0.0.0 \
    --port 30000
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/chat/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "my-ai-stack/Stack-2-9-finetuned",
		"messages": [
			{
				"role": "user",
				"content": "What is the capital of France?"
			}
		]
	}'

Use Docker images

docker run --gpus all \
    --shm-size 32g \
    -p 30000:30000 \
    -v ~/.cache/huggingface:/root/.cache/huggingface \
    --env "HF_TOKEN=<secret>" \
    --ipc=host \
    lmsysorg/sglang:latest \
    python3 -m sglang.launch_server \
        --model-path "my-ai-stack/Stack-2-9-finetuned" \
        --host 0.0.0.0 \
        --port 30000
# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/chat/completions" \
	-H "Content-Type: application/json" \
	--data '{
		"model": "my-ai-stack/Stack-2-9-finetuned",
		"messages": [
			{
				"role": "user",
				"content": "What is the capital of France?"
			}
		]
	}'

Docker Model Runner
How to use my-ai-stack/Stack-2-9-finetuned with Docker Model Runner:
```
docker model run hf.co/my-ai-stack/Stack-2-9-finetuned
```

Stack-2-9-finetuned / src /enhancements /config.py

walidsobhie-code

feat: Add comprehensive enhancement modules for Stack 2.9

8f05ad1 about 2 months ago

raw

history blame contribute delete

3.67 kB

	"""
	Stack 2.9 Enhancement Configuration
	Central configuration for all enhancement features.
	"""

	from dataclasses import dataclass, field
	from typing import Optional
	import os


	@dataclass
	class NLPConfig:
	"""Configuration for NLP enhancements."""
	use_bert_embeddings: bool = True
	bert_model: str = "bert-base-uncased"
	use_entity_recognition: bool = True
	use_intent_detection: bool = True
	max_context_length: int = 512
	embedding_cache_size: int = 1000


	@dataclass
	class KnowledgeGraphConfig:
	"""Configuration for knowledge graph."""
	enabled: bool = True
	backend: str = "networkx" # or "neo4j"
	max_nodes: int = 10000
	max_edges: int = 50000
	similarity_threshold: float = 0.7
	rag_enabled: bool = True
	rag_top_k: int = 5


	@dataclass
	class EmotionalIntelligenceConfig:
	"""Configuration for emotional intelligence."""
	enabled: bool = True
	sentiment_model: str = "distilbert-base-uncased-finetuned-sst-2-english"
	detect_emotions: bool = True
	empathetic_responses: bool = True
	emotion_sensitivity: float = 0.5


	@dataclass
	class CollaborationConfig:
	"""Configuration for collaboration features."""
	mcp_enabled: bool = True
	conversation_state_enabled: bool = True
	max_sessions: int = 10
	session_timeout_minutes: int = 60


	@dataclass
	class LearningConfig:
	"""Configuration for learning and adaptation."""
	enabled: bool = True
	feedback_storage_path: str = "data/feedback"
	auto_finetune: bool = False
	finetune_every_n_feedback: int = 100
	performance_monitoring: bool = True


	@dataclass
	class EnhancementConfig:
	"""Main configuration for all enhancements."""
	nlp: NLPConfig = field(default_factory=NLPConfig)
	knowledge_graph: KnowledgeGraphConfig = field(default_factory=KnowledgeGraphConfig)
	emotional_intelligence: EmotionalIntelligenceConfig = field(default_factory=EmotionalIntelligenceConfig)
	collaboration: CollaborationConfig = field(default_factory=CollaborationConfig)
	learning: LearningConfig = field(default_factory=LearningConfig)

	# Global enable/disable
	all_enabled: bool = True

	@classmethod
	def from_env(cls) -> "EnhancementConfig":
	"""Create config from environment variables."""
	config = cls()

	# NLP settings
	if os.getenv("NLP_USE_BERT"):
	config.nlp.use_bert_embeddings = os.getenv("NLP_USE_BERT").lower() == "true"
	if os.getenv("NLP_BERT_MODEL"):
	config.nlp.bert_model = os.getenv("NLP_BERT_MODEL")

	# Knowledge graph settings
	if os.getenv("KG_ENABLED"):
	config.knowledge_graph.enabled = os.getenv("KG_ENABLED").lower() == "true"
	if os.getenv("KG_RAG_ENABLED"):
	config.knowledge_graph.rag_enabled = os.getenv("KG_RAG_ENABLED").lower() == "true"

	# Emotional intelligence settings
	if os.getenv("EI_ENABLED"):
	config.emotional_intelligence.enabled = os.getenv("EI_ENABLED").lower() == "true"

	# Learning settings
	if os.getenv("LEARNING_ENABLED"):
	config.learning.enabled = os.getenv("LEARNING_ENABLED").lower() == "true"

	return config


	# Global config instance
	_default_config: Optional[EnhancementConfig] = None


	def get_config() -> EnhancementConfig:
	"""Get the global enhancement config instance."""
	global _default_config
	if _default_config is None:
	_default_config = EnhancementConfig.from_env()
	return _default_config


	def set_config(config: EnhancementConfig) -> None:
	"""Set the global enhancement config instance."""
	global _default_config
	_default_config = config