JunHowie committed on
Commit
a838c55
·
verified ·
1 Parent(s): 98c1be3

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +5 -5
README.md CHANGED
@@ -6,12 +6,12 @@ tags:
6
  - vLLM
7
  - AWQ
8
  base_model:
9
- - ZhipuAI/GLM-5
10
  base_model_relation: quantized
11
 
12
  ---
13
  # GLM-5-AWQ
14
- Base model: [ZhipuAI/GLM-5](https://www.modelscope.cn/models/ZhipuAI/GLM-5)
15
 
16
  This repo quantizes the model using data-free quantization (no calibration dataset required).
17
 
@@ -47,7 +47,7 @@ export VLLM_USE_FLASHINFER_SAMPLER=0
47
  export OMP_NUM_THREADS=4
48
 
49
  vllm serve \
50
- __YOUR_PATH__/tclf90/GLM-5-AWQ \
51
  --served-model-name MY_MODEL \
52
  --swap-space 16 \
53
  --max-num-seqs 32 \
@@ -77,8 +77,8 @@ vllm serve \
77
 
78
  ### 【Model Download】
79
  ```python
80
- from modelscope import snapshot_download
81
- snapshot_download('tclf90/GLM-5-AWQ', cache_dir="your_local_path")
82
  ```
83
 
84
  ### 【Overview】
 
6
  - vLLM
7
  - AWQ
8
  base_model:
9
+ - zai-org/GLM-5
10
  base_model_relation: quantized
11
 
12
  ---
13
  # GLM-5-AWQ
14
+ Base model: [zai-org/GLM-5](https://huggingface.co/zai-org/GLM-5)
15
 
16
  This repo quantizes the model using data-free quantization (no calibration dataset required).
17
 
 
47
  export OMP_NUM_THREADS=4
48
 
49
  vllm serve \
50
+ __YOUR_PATH__/QuantTrio/GLM-5-AWQ \
51
  --served-model-name MY_MODEL \
52
  --swap-space 16 \
53
  --max-num-seqs 32 \
 
77
 
78
  ### 【Model Download】
79
  ```python
80
+ from huggingface_hub import snapshot_download
81
+ snapshot_download('QuantTrio/GLM-5-AWQ', cache_dir="your_local_path")
82
  ```
83
 
84
  ### 【Overview】