Spaces:
Build error
Build error
update config for 14b pre-quantized model
Browse files
config.py
CHANGED
|
@@ -5,8 +5,8 @@ quantized = {
|
|
| 5 |
"mode": TORCH_QUANT,
|
| 6 |
"runtimedtype": torch.bfloat16,
|
| 7 |
"useGPU": torch.cuda.is_available(),
|
| 8 |
-
"chunksize": 32, # larger = more accurate, but more memory
|
| 9 |
-
"target":
|
| 10 |
}
|
| 11 |
|
| 12 |
# UNCOMMENT TO SELECT OPTIONS
|
|
@@ -57,7 +57,20 @@ title = "RWKV-4 (1.5b Instruct Test 2)"
|
|
| 57 |
# [File size: 28.0GB]
|
| 58 |
|
| 59 |
# config = {
|
| 60 |
-
# "path": "https://huggingface.co/BlinkDL/rwkv-4-pile-14b/resolve/main/RWKV-4-Pile-14B-20230204-7324.pth"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 61 |
# }
|
| 62 |
|
| 63 |
-
# title = "RWKV-4 (14b)"
|
|
|
|
| 5 |
"mode": TORCH_QUANT,
|
| 6 |
"runtimedtype": torch.bfloat16,
|
| 7 |
"useGPU": torch.cuda.is_available(),
|
| 8 |
+
"chunksize": 32, # larger = more accurate, but more memory (and slower)
|
| 9 |
+
"target": 24 # your GPU's max memory size; excess VRAM is offloaded to the CPU
|
| 10 |
}
|
| 11 |
|
| 12 |
# UNCOMMENT TO SELECT OPTIONS
|
|
|
|
| 57 |
# [File size: 28.0GB]
|
| 58 |
|
| 59 |
# config = {
|
| 60 |
+
# "path": "https://huggingface.co/BlinkDL/rwkv-4-pile-14b/resolve/main/RWKV-4-Pile-14B-20230204-7324.pth",
|
| 61 |
+
# **quantized
|
| 62 |
+
# }
|
| 63 |
+
|
| 64 |
+
# title = "RWKV-4 (14b Quantized)"
|
| 65 |
+
|
| 66 |
+
|
| 67 |
+
# RWKV 14B pre-quantized (latest as of Feb 9)
|
| 68 |
+
# Approximate
|
| 69 |
+
# [Vram usage: 15.0GB]
|
| 70 |
+
# [File size: 14.4GB]
|
| 71 |
+
|
| 72 |
+
# config = {
|
| 73 |
+
# "path": "https://huggingface.co/Hazzzardous/RWKV-8Bit/resolve/main/RWKV-4-Pile-14B-20230204-7324.pqth"
|
| 74 |
# }
|
| 75 |
|
| 76 |
+
# title = "RWKV-4 (14b Quantized)"
|