lwanming committed on
Commit
e14e7cc
·
verified ·
1 Parent(s): 50472f1

Upload 4 files

Browse files
.gitattributes CHANGED
@@ -37,3 +37,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
37
  1_prefill_INT4_128.onnx.data filter=lfs diff=lfs merge=lfs -text
38
  2_decode_INT4_128_fp16.onnx.data filter=lfs diff=lfs merge=lfs -text
39
  2_decode_INT4_128.onnx.data filter=lfs diff=lfs merge=lfs -text
 
 
 
37
  1_prefill_INT4_128.onnx.data filter=lfs diff=lfs merge=lfs -text
38
  2_decode_INT4_128_fp16.onnx.data filter=lfs diff=lfs merge=lfs -text
39
  2_decode_INT4_128.onnx.data filter=lfs diff=lfs merge=lfs -text
40
+ Phi_3_mini_4k_instruct_decoder_static_kvcache_simplifiedlayernorm_fp16.onnx.data filter=lfs diff=lfs merge=lfs -text
41
+ Phi_3_mini_4k_instruct_decoder_static_kvcache_simplifiedlayernorm.onnx.data filter=lfs diff=lfs merge=lfs -text
Phi_3_mini_4k_instruct_decoder_static_kvcache_simplifiedlayernorm.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cbbe0179e5eba0e2d4f14d63066c02fd21e755eeb28ad8a34789fe4eb7e7f6f
3
+ size 1124755058
Phi_3_mini_4k_instruct_decoder_static_kvcache_simplifiedlayernorm.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4253319ea723a8709f8a8d3d102580b3c969294782b01754bf843e67e2990063
3
+ size 1248559104
Phi_3_mini_4k_instruct_decoder_static_kvcache_simplifiedlayernorm_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bad5ef4c44b2aeabfb54cbd395e9f48b675948f45f942bcb024c6eb55866a2c7
3
+ size 1066269131
Phi_3_mini_4k_instruct_decoder_static_kvcache_simplifiedlayernorm_fp16.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b39563b369c3bb31b0adaf1836f91008a2cc65ad68d2f50b3e0faf6fd36aae08
3
+ size 1051557888