robgreenberg3 committed on
Commit
61555f2
·
verified ·
1 Parent(s): f3a4627

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +31 -2
README.md CHANGED
@@ -1,4 +1,33 @@
1
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  <h1 style="display: flex; align-items: center; gap: 10px; margin: 0;">
3
  Kimi-K2-Instruct-quantized.w4a16
4
  <img src="https://www.redhat.com/rhdc/managed-files/Catalog-Validated_model_0.png" alt="Model Icon" width="40" style="margin: 0; padding: 0;" />
@@ -153,7 +182,7 @@ spec:
153
  name: vLLM
154
  containers:
155
  - name: kserve-container
156
- image: quay.io/modh/vllm:rhoai-2.24-cuda # CHANGE if needed. If AMD: quay.io/modh/vllm:rhoai-2.20-rocm
157
  command:
158
  - python
159
  - -m
 
1
+ ---
2
+ language:
3
+ - en
4
+ base_model:
5
+ - moonshotai/Kimi-K2-Instruct
6
+ pipeline_tag: text-generation
7
+ tags:
8
+ - kimi-k2
9
+ - MOE
10
+ - neuralmagic
11
+ - redhat
12
+ - llmcompressor
13
+ - quantized
14
+ - INT4
15
+ - GPTQ
16
+ - conversational
17
+ - compressed-tensors
18
+ license: other
19
+ license_name: modified-mit
20
+ name: RedHatAI/Kimi-K2-Instruct-quantized.w4a16
21
+ description: >-
22
+ This model was obtained by quantizing weights of moonshotai/Kimi-K2-Instruct to INT4 data
23
+ type.
24
+ readme: >-
25
+ https://huggingface.co/RedHatAI/Kimi-K2-Instruct-quantized.w4a16/blob/main/README.md
26
+ tasks:
27
+ - text-to-text
28
+ provider: Moonshot AI
29
+ license_link: https://huggingface.co/moonshotai/Kimi-K2-Instruct/blob/main/LICENSE
30
+ ---
31
  <h1 style="display: flex; align-items: center; gap: 10px; margin: 0;">
32
  Kimi-K2-Instruct-quantized.w4a16
33
  <img src="https://www.redhat.com/rhdc/managed-files/Catalog-Validated_model_0.png" alt="Model Icon" width="40" style="margin: 0; padding: 0;" />
 
182
  name: vLLM
183
  containers:
184
  - name: kserve-container
185
+ image: quay.io/modh/vllm:rhoai-2.24-cuda # CHANGE if needed. If AMD: quay.io/modh/vllm:rhoai-2.24-rocm
186
  command:
187
  - python
188
  - -m