Spaces:

yahma
/

rwkv-instruct

Build error

gururise commited on Feb 9, 2023

Commit

750b68d

1 Parent(s): efafe5a

update config for 14b pre-quantized model

Files changed (1) hide show

config.py CHANGED Viewed

@@ -5,8 +5,8 @@ quantized = {
     "mode": TORCH_QUANT,
     "runtimedtype": torch.bfloat16,
     "useGPU": torch.cuda.is_available(),
-    "chunksize": 32,  # larger = more accurate, but more memory
-    "target": 100  # your gpu max size, excess vram offloaded to cpu
 }
 # UNCOMMENT TO SELECT OPTIONS
@@ -57,7 +57,20 @@ title = "RWKV-4 (1.5b Instruct Test 2)"
 # [File size: 28.0GB]
 # config = {
-#     "path": "https://huggingface.co/BlinkDL/rwkv-4-pile-14b/resolve/main/RWKV-4-Pile-14B-20230204-7324.pth"
 # }
-# title = "RWKV-4 (14b)"

     "mode": TORCH_QUANT,
     "runtimedtype": torch.bfloat16,
     "useGPU": torch.cuda.is_available(),
+    "chunksize": 32,  # larger = more accurate, but more memory (and slower)
+    "target": 24  # your gpu max size, excess vram offloaded to cpu
 }
 # UNCOMMENT TO SELECT OPTIONS
 # [File size: 28.0GB]
 # config = {
+#     "path": "https://huggingface.co/BlinkDL/rwkv-4-pile-14b/resolve/main/RWKV-4-Pile-14B-20230204-7324.pth",
+#     **quantized
+# }
+# title = "RWKV-4 (14b Quantized)"
+# RWKV 14B pre-quantized (latest as of feb 9)
+# Approximate
+# [Vram usage: 15.0GB]
+# [File size: 14.4GB]
+# config = {
+#     "path": "https://huggingface.co/Hazzzardous/RWKV-8Bit/resolve/main/RWKV-4-Pile-14B-20230204-7324.pqth"
 # }
+# title = "RWKV-4 (14b Quantized)"