Duplicate from lakhera2023/devops-slm-v1

Browse files

Co-authored-by: Prashant Lakhera <lakhera2023@users.noreply.huggingface.co>

Files changed (11) hide show

.gitattributes +36 -0
README.md +96 -0
adapter_config.json +44 -0
adapter_model.safetensors +3 -0
added_tokens.json +24 -0
chat_template.jinja +86 -0
merges.txt +0 -0
special_tokens_map.json +31 -0
tokenizer.json +3 -0
tokenizer_config.json +47 -0
vocab.json +0 -0

.gitattributes ADDED Viewed

	@@ -0,0 +1,36 @@

+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,96 @@

+---
+license: apache-2.0
+tags:
+- devops
+- kubernetes
+- docker
+- ci-cd
+- infrastructure
+- monitoring
+- specialized
+pipeline_tag: text-generation
+---
+# DevOps Specialized Language Model v1
+## 🎯 Model Overview
+This is a **specialized language model** built for **DevOps tasks and operations only**.
+## ⚠️ Important Notice
+**This model is designed EXCLUSIVELY for DevOps-related tasks. It has robust filtering and will NOT answer general questions about movies, weather, cooking, sports, music, travel, health, education, politics, religion, philosophy, entertainment, gaming, fashion, or any other non-DevOps topics.**
+**The model will automatically redirect any non-DevOps questions back to DevOps topics.**
+## 🚀 Capabilities
+The model specializes in:
+- **Kubernetes Operations**: Deployments, pods, services, troubleshooting
+- **Docker Containerization**: Container management, Dockerfiles, best practices
+- **CI/CD Pipelines**: GitHub Actions, GitLab CI, Jenkins, automation
+- **Infrastructure Automation**: Terraform, Ansible, infrastructure as code
+- **Monitoring & Observability**: Logging, metrics, alerting, performance monitoring
+- **Cloud Platform Operations**: AWS, Azure, GCP, cloud-native solutions
+- **DevOps Tools**: Helm, Prometheus, Grafana, ELK stack, and more
+## 🚫 Limitations
+- **DevOps Only**: Will not answer non-DevOps questions; it redirects them back to DevOps topics
+- **Specialized Knowledge**: Focused on DevOps practices and tools
+## 💻 Usage
+### Basic Usage
+A runnable usage example is available in this Google Colab notebook: https://colab.research.google.com/drive/1UgTUI6AeVnSlknHoF3cEDhWLHYirghju?usp=sharing
+### Example Queries
+✅ **Good DevOps Questions:**
+- "How do I create a Kubernetes deployment?"
+- "What's the difference between Docker and Podman?"
+- "How do I set up a CI/CD pipeline with GitHub Actions?"
+- "How do I troubleshoot a failing Kubernetes pod?"
+- "What are the best practices for container security?"
+❌ **Non-DevOps Questions (will be redirected):**
+- "Tell me about movies" → Redirected to DevOps
+- "What's the weather like?" → Redirected to DevOps
+- "Explain quantum physics" → Redirected to DevOps
+- "Write a poem" → Redirected to DevOps
+- "How to cook pasta?" → Redirected to DevOps
+- "Who won the football game?" → Redirected to DevOps
+- "Recommend some music" → Redirected to DevOps
+- "Best travel destinations" → Redirected to DevOps
+## 🔧 Technical Details
+- **Base Model**: lakhera2023/Qwen-model
+- **Architecture**: Transformer-based with LoRA fine-tuning
+- **Training**: DevOps-specific examples
+- **Specialization**: Fine-tuned for DevOps tasks only
+## 📊 Performance
+This model is optimized for:
+- **DevOps Task Accuracy**: High precision on DevOps-related queries
+- **Response Quality**: Clear, actionable DevOps guidance
+- **Topic Focus**: Strict adherence to DevOps-only responses
+## 🤝 Contributing
+This model is specialized for the DevOps community. If you have suggestions for improvements or additional DevOps training data, please open an issue.
+## 📄 License
+This model is released under the Apache 2.0 License.
+## ⚠️ Disclaimer
+This model is designed for educational and professional DevOps use. Always verify any deployment or configuration advice in a safe environment before applying to production systems.
+---
+**Remember: This model is DevOps-only. It will not respond to general questions.**

adapter_config.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "alpha_pattern": {},
+  "auto_mapping": null,
+  "base_model_name_or_path": "lakhera2023/Qwen-model",
+  "bias": "none",
+  "corda_config": null,
+  "eva_config": null,
+  "exclude_modules": null,
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layer_replication": null,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "loftq_config": {},
+  "lora_alpha": 32,
+  "lora_bias": false,
+  "lora_dropout": 0.1,
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "qalora_group_size": 16,
+  "r": 16,
+  "rank_pattern": {},
+  "revision": null,
+  "target_modules": [
+    "down_proj",
+    "up_proj",
+    "gate_proj",
+    "q_proj",
+    "v_proj",
+    "k_proj",
+    "o_proj"
+  ],
+  "target_parameters": null,
+  "task_type": "CAUSAL_LM",
+  "trainable_token_indices": null,
+  "use_dora": false,
+  "use_qalora": false,
+  "use_rslora": false,
+  "model_name": "DevOps-SLM-v1",
+  "model_type": "devops_specialized"
+}

adapter_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d0d30c7a80215bc335d9888d6eeaed14a5f9341b2eea123d883ef9976cebd24f
+size 73911112

added_tokens.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "</tool_call>": 151658,
+  "<tool_call>": 151657,
+  "<|box_end|>": 151649,
+  "<|box_start|>": 151648,
+  "<|endoftext|>": 151643,
+  "<|file_sep|>": 151664,
+  "<|fim_middle|>": 151660,
+  "<|fim_pad|>": 151662,
+  "<|fim_prefix|>": 151659,
+  "<|fim_suffix|>": 151661,
+  "<|im_end|>": 151645,
+  "<|im_start|>": 151644,
+  "<|image_pad|>": 151655,
+  "<|object_ref_end|>": 151647,
+  "<|object_ref_start|>": 151646,
+  "<|quad_end|>": 151651,
+  "<|quad_start|>": 151650,
+  "<|repo_name|>": 151663,
+  "<|video_pad|>": 151656,
+  "<|vision_end|>": 151653,
+  "<|vision_pad|>": 151654,
+  "<|vision_start|>": 151652
+}

chat_template.jinja ADDED Viewed

	@@ -0,0 +1,86 @@

+{#- Chat template: renders `messages` (and optional `tools`) into a prompt where every turn is wrapped in <|im_start|>role ... <|im_end|>. #}
+{#- Part 1: system turn. With tools, the system text is followed by the tool signatures and the tool-call format instructions. #}
+{%- if tools %}
+    {{- '<|im_start|>system
+' }}
+    {#- Use the caller's system message when it is the first message; otherwise fall back to the built-in DevOps-only prompt. #}
+    {%- if messages[0]['role'] == 'system' %}
+        {{- messages[0]['content'] }}
+    {%- else %}
+        {{- 'You are a specialized DevOps assistant. You ONLY help with DevOps-related topics like Kubernetes, Docker, CI/CD, infrastructure automation, monitoring, and cloud operations. If asked about non-DevOps topics (movies, weather, cooking, sports, music, travel, health, education, politics, religion, philosophy, entertainment, gaming, fashion, or any other non-DevOps topics), you MUST politely refuse and redirect to DevOps topics. You are NOT a general assistant.' }}
+    {%- endif %}
+    {{- "
+# Tools
+You may call one or more functions to assist with the user query.
+You are provided with function signatures within <tools></tools> XML tags:
+<tools>" }}
+    {#- One JSON-serialized tool definition per line inside <tools>. #}
+    {%- for tool in tools %}
+        {{- "
+" }}
+        {{- tool | tojson }}
+    {%- endfor %}
+    {{- "
+</tools>
+For each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:
+<tool_call>
+{"name": <function-name>, "arguments": <args-json-object>}
+</tool_call><|im_end|>
+" }}
+{%- else %}
+    {#- No tools: emit a plain system turn, again preferring the caller's leading system message over the default prompt. #}
+    {%- if messages[0]['role'] == 'system' %}
+        {{- '<|im_start|>system
+' + messages[0]['content'] + '<|im_end|>
+' }}
+    {%- else %}
+        {{- '<|im_start|>system
+You are a specialized DevOps assistant. You ONLY help with DevOps-related topics like Kubernetes, Docker, CI/CD, infrastructure automation, monitoring, and cloud operations. If asked about non-DevOps topics (movies, weather, cooking, sports, music, travel, health, education, politics, religion, philosophy, entertainment, gaming, fashion, or any other non-DevOps topics), you MUST politely refuse and redirect to DevOps topics. You are NOT a general assistant.<|im_end|>
+' }}
+    {%- endif %}
+{%- endif %}
+{#- Part 2: conversation turns. #}
+{%- for message in messages %}
+    {#- Plain turns: user, assistant without tool calls, and any system message that is not the first message (a leading system message was already emitted above). #}
+    {%- if (message.role == "user") or (message.role == "system" and not loop.first) or (message.role == "assistant" and not message.tool_calls) %}
+        {{- '<|im_start|>' + message.role + '
+' + message.content + '<|im_end|>' + '
+' }}
+    {#- Assistant turn with tool calls: optional text content followed by one <tool_call> block per call. #}
+    {%- elif message.role == "assistant" %}
+        {{- '<|im_start|>' + message.role }}
+        {%- if message.content %}
+            {{- '
+' + message.content }}
+        {%- endif %}
+        {%- for tool_call in message.tool_calls %}
+            {#- Accept both shapes: the call nested under `.function`, or name/arguments directly on the item. #}
+            {%- if tool_call.function is defined %}
+                {%- set tool_call = tool_call.function %}
+            {%- endif %}
+            {{- '
+<tool_call>
+{"name": "' }}
+            {{- tool_call.name }}
+            {{- '", "arguments": ' }}
+            {{- tool_call.arguments | tojson }}
+            {{- '}
+</tool_call>' }}
+        {%- endfor %}
+        {{- '<|im_end|>
+' }}
+    {#- Tool results: a run of consecutive tool messages is folded into a single user turn, each result wrapped in <tool_response>. #}
+    {%- elif message.role == "tool" %}
+        {#- Open the user turn only for the first tool message of a run. #}
+        {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != "tool") %}
+            {{- '<|im_start|>user' }}
+        {%- endif %}
+        {{- '
+<tool_response>
+' }}
+        {{- message.content }}
+        {{- '
+</tool_response>' }}
+        {#- Close the user turn only after the last tool message of a run. #}
+        {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
+            {{- '<|im_end|>
+' }}
+        {%- endif %}
+    {%- endif %}
+{%- endfor %}
+{#- Part 3: when requested, open an assistant turn for the model to complete. #}
+{%- if add_generation_prompt %}
+    {{- '<|im_start|>assistant
+' }}
+{%- endif %}

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>",
+    "<|object_ref_start|>",
+    "<|object_ref_end|>",
+    "<|box_start|>",
+    "<|box_end|>",
+    "<|quad_start|>",
+    "<|quad_end|>",
+    "<|vision_start|>",
+    "<|vision_end|>",
+    "<|vision_pad|>",
+    "<|image_pad|>",
+    "<|video_pad|>"
+  ],
+  "eos_token": {
+    "content": "<|im_end|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb0180d9179612e308a799d915cf8ccbcced4a006b9562e78fa1121cc61cc1b5
+size 11422162

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,47 @@

+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151645": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>",
+    "<|endoftext|>"
+  ],
+  "bos_token": "<|im_start|>",
+  "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\\nYou are a specialized DevOps assistant. You help with DevOps tasks only.<|im_end|>\\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\\n' + message['content'] + '<|im_end|>' + '\\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\\n' }}{% endif %}",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|im_end|>",
+  "errors": "replace",
+  "model_max_length": 32768,
+  "pad_token": "<|endoftext|>",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "PreTrainedTokenizerFast",
+  "unk_token": "<|endoftext|>",
+  "use_fast": true,
+  "vocab_size": 151646
+}

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff