JLake310 committed on
Commit
cc4f980
·
verified ·
1 Parent(s): dccb3f8

change precision to fp32

Browse files
mlc-chat-config.json CHANGED
@@ -27,7 +27,8 @@
27
  "context_window_size": 768,
28
  "prefill_chunk_size": 0,
29
  "max_batch_size": 80,
30
- "tensor_parallel_shards": 1
 
31
  },
32
  "vocab_size": 50265,
33
  "context_window_size": 768,
 
27
  "context_window_size": 768,
28
  "prefill_chunk_size": 0,
29
  "max_batch_size": 80,
30
+ "tensor_parallel_shards": 1,
31
+ "dtype": "float32"
32
  },
33
  "vocab_size": 50265,
34
  "context_window_size": 768,
roberta-cls-model-q0f32-android.tar CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aed76df6f74c17a1d9bc067b97bceb4ad064b0d8b05db9de9c061d2ee85e73d0
3
- size 112431
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:127c68c8bcf0923fa75081acea5197cb48137a5a74f1f35c3c80c8533754ab4a
3
+ size 111882