shreyask committed on
Commit
e059fae
·
verified ·
1 Parent(s): bf6eb86

fp16 WebGPU ONNX (no quantization, compatible ops)

Browse files
generation_config.json CHANGED
@@ -2,6 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "eos_token_id": 7,
5
- "pad_token_id": 0,
6
- "transformers_version": "5.1.0"
7
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "eos_token_id": 7,
5
+ "pad_token_id": 0
 
6
  }
onnx/model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d74269b82e2bddc5e82425ae0320d5a937d54e94a26cd536a97b68ac17d6a5db
3
- size 171599
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:292bad950fe2cddf413b119d71e6972eb84c1da9b5805b5560ef55700d46fbd0
3
+ size 138095
onnx/model.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b49370ce0d23a0d876b6f1ee6ad8b908c7a8e4c5c2994bb91bd7245cc52c4205
3
- size 943325184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e85523d5c8c5a57a4282fa24f69baee6aae1ae2c2087960b7bc3858fc192a420
3
+ size 2357067776