Text Generation
Transformers
English
qwen2
code-generation
python
fine-tuning
Qwen
tools
agent-framework
multi-agent
conversational
Eval Results (legacy)
Instructions to use my-ai-stack/Stack-2-9-finetuned with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use my-ai-stack/Stack-2-9-finetuned with Transformers:
# Use a pipeline as a high-level helper from transformers import pipeline pipe = pipeline("text-generation", model="my-ai-stack/Stack-2-9-finetuned") messages = [ {"role": "user", "content": "Who are you?"}, ] pipe(messages)# Load model directly from transformers import AutoTokenizer, AutoModelForCausalLM tokenizer = AutoTokenizer.from_pretrained("my-ai-stack/Stack-2-9-finetuned") model = AutoModelForCausalLM.from_pretrained("my-ai-stack/Stack-2-9-finetuned") messages = [ {"role": "user", "content": "Who are you?"}, ] inputs = tokenizer.apply_chat_template( messages, add_generation_prompt=True, tokenize=True, return_dict=True, return_tensors="pt", ).to(model.device) outputs = model.generate(**inputs, max_new_tokens=40) print(tokenizer.decode(outputs[0][inputs["input_ids"].shape[-1]:])) - Notebooks
- Google Colab
- Kaggle
- Local Apps
- vLLM
How to use my-ai-stack/Stack-2-9-finetuned with vLLM:
Install from pip and serve model
# Install vLLM from pip: pip install vllm # Start the vLLM server: vllm serve "my-ai-stack/Stack-2-9-finetuned" # Call the server using curl (OpenAI-compatible API): curl -X POST "http://localhost:8000/v1/chat/completions" \ -H "Content-Type: application/json" \ --data '{ "model": "my-ai-stack/Stack-2-9-finetuned", "messages": [ { "role": "user", "content": "What is the capital of France?" } ] }'Use Docker
docker model run hf.co/my-ai-stack/Stack-2-9-finetuned
- SGLang
How to use my-ai-stack/Stack-2-9-finetuned with SGLang:
Install from pip and serve model
# Install SGLang from pip: pip install sglang # Start the SGLang server: python3 -m sglang.launch_server \ --model-path "my-ai-stack/Stack-2-9-finetuned" \ --host 0.0.0.0 \ --port 30000 # Call the server using curl (OpenAI-compatible API): curl -X POST "http://localhost:30000/v1/chat/completions" \ -H "Content-Type: application/json" \ --data '{ "model": "my-ai-stack/Stack-2-9-finetuned", "messages": [ { "role": "user", "content": "What is the capital of France?" } ] }'Use Docker images
docker run --gpus all \ --shm-size 32g \ -p 30000:30000 \ -v ~/.cache/huggingface:/root/.cache/huggingface \ --env "HF_TOKEN=<secret>" \ --ipc=host \ lmsysorg/sglang:latest \ python3 -m sglang.launch_server \ --model-path "my-ai-stack/Stack-2-9-finetuned" \ --host 0.0.0.0 \ --port 30000 # Call the server using curl (OpenAI-compatible API): curl -X POST "http://localhost:30000/v1/chat/completions" \ -H "Content-Type: application/json" \ --data '{ "model": "my-ai-stack/Stack-2-9-finetuned", "messages": [ { "role": "user", "content": "What is the capital of France?" } ] }' - Docker Model Runner
How to use my-ai-stack/Stack-2-9-finetuned with Docker Model Runner:
docker model run hf.co/my-ai-stack/Stack-2-9-finetuned
| """ | |
| Stack 2.9 Enhancement Configuration | |
| Central configuration for all enhancement features. | |
| """ | |
| from dataclasses import dataclass, field | |
| from typing import Optional | |
| import os | |
| class NLPConfig: | |
| """Configuration for NLP enhancements.""" | |
| use_bert_embeddings: bool = True | |
| bert_model: str = "bert-base-uncased" | |
| use_entity_recognition: bool = True | |
| use_intent_detection: bool = True | |
| max_context_length: int = 512 | |
| embedding_cache_size: int = 1000 | |
| class KnowledgeGraphConfig: | |
| """Configuration for knowledge graph.""" | |
| enabled: bool = True | |
| backend: str = "networkx" # or "neo4j" | |
| max_nodes: int = 10000 | |
| max_edges: int = 50000 | |
| similarity_threshold: float = 0.7 | |
| rag_enabled: bool = True | |
| rag_top_k: int = 5 | |
| class EmotionalIntelligenceConfig: | |
| """Configuration for emotional intelligence.""" | |
| enabled: bool = True | |
| sentiment_model: str = "distilbert-base-uncased-finetuned-sst-2-english" | |
| detect_emotions: bool = True | |
| empathetic_responses: bool = True | |
| emotion_sensitivity: float = 0.5 | |
| class CollaborationConfig: | |
| """Configuration for collaboration features.""" | |
| mcp_enabled: bool = True | |
| conversation_state_enabled: bool = True | |
| max_sessions: int = 10 | |
| session_timeout_minutes: int = 60 | |
| class LearningConfig: | |
| """Configuration for learning and adaptation.""" | |
| enabled: bool = True | |
| feedback_storage_path: str = "data/feedback" | |
| auto_finetune: bool = False | |
| finetune_every_n_feedback: int = 100 | |
| performance_monitoring: bool = True | |
| class EnhancementConfig: | |
| """Main configuration for all enhancements.""" | |
| nlp: NLPConfig = field(default_factory=NLPConfig) | |
| knowledge_graph: KnowledgeGraphConfig = field(default_factory=KnowledgeGraphConfig) | |
| emotional_intelligence: EmotionalIntelligenceConfig = field(default_factory=EmotionalIntelligenceConfig) | |
| collaboration: CollaborationConfig = field(default_factory=CollaborationConfig) | |
| learning: LearningConfig = field(default_factory=LearningConfig) | |
| # Global enable/disable | |
| all_enabled: bool = True | |
| def from_env(cls) -> "EnhancementConfig": | |
| """Create config from environment variables.""" | |
| config = cls() | |
| # NLP settings | |
| if os.getenv("NLP_USE_BERT"): | |
| config.nlp.use_bert_embeddings = os.getenv("NLP_USE_BERT").lower() == "true" | |
| if os.getenv("NLP_BERT_MODEL"): | |
| config.nlp.bert_model = os.getenv("NLP_BERT_MODEL") | |
| # Knowledge graph settings | |
| if os.getenv("KG_ENABLED"): | |
| config.knowledge_graph.enabled = os.getenv("KG_ENABLED").lower() == "true" | |
| if os.getenv("KG_RAG_ENABLED"): | |
| config.knowledge_graph.rag_enabled = os.getenv("KG_RAG_ENABLED").lower() == "true" | |
| # Emotional intelligence settings | |
| if os.getenv("EI_ENABLED"): | |
| config.emotional_intelligence.enabled = os.getenv("EI_ENABLED").lower() == "true" | |
| # Learning settings | |
| if os.getenv("LEARNING_ENABLED"): | |
| config.learning.enabled = os.getenv("LEARNING_ENABLED").lower() == "true" | |
| return config | |
| # Global config instance | |
| _default_config: Optional[EnhancementConfig] = None | |
| def get_config() -> EnhancementConfig: | |
| """Get the global enhancement config instance.""" | |
| global _default_config | |
| if _default_config is None: | |
| _default_config = EnhancementConfig.from_env() | |
| return _default_config | |
| def set_config(config: EnhancementConfig) -> None: | |
| """Set the global enhancement config instance.""" | |
| global _default_config | |
| _default_config = config |