Update NVFP4 with real allenai/c4 calibration (20260304-021249)
Browse files
- .gitattributes +1 -0
- model-00001-of-00013.safetensors +1 -1
- model-00002-of-00013.safetensors +1 -1
- model-00003-of-00013.safetensors +1 -1
- model-00004-of-00013.safetensors +1 -1
- model-00005-of-00013.safetensors +1 -1
- model-00006-of-00013.safetensors +1 -1
- model-00007-of-00013.safetensors +1 -1
- model-00008-of-00013.safetensors +1 -1
- model-00009-of-00013.safetensors +1 -1
- model-00010-of-00013.safetensors +1 -1
- model-00011-of-00013.safetensors +1 -1
- model-00012-of-00013.safetensors +1 -1
- model-00013-of-00013.safetensors +1 -1
- spark_quantizer_provenance.json +4 -4
- tokenizer.json +0 -0
- tokenizer_config.json +1 -1
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
model-00001-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983536328
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:882691caff2eaa1451c4b79fc7deeeacca706317ca5b9ed08f25815bae38b117
|
| 3 |
size 4983536328
|
model-00002-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985162232
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:636f3a62f2d00b0d3f424ea7e9ec248cf72be456297784bfc61c042d6dca75b5
|
| 3 |
size 4985162232
|
model-00003-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985162624
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:787ed4b33bb36512fd03e2fc116992936457ad21279614299b8b9bf02ca431d5
|
| 3 |
size 4985162624
|
model-00004-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985163840
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b60fb496240c9fa6b81ee2d8925cc6a8e962a834c8c80c4f20fc97040514f10
|
| 3 |
size 4985163840
|
model-00005-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985163840
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b0f79e50bba113e112837456d2855f11c695a26250da851a2418ddf6e3a9bff6
|
| 3 |
size 4985163840
|
model-00006-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985163840
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75340cc52c9367fdd65c42f390fdfad07b0cd5fb813ee9cd9c7c3b34f2544689
|
| 3 |
size 4985163840
|
model-00007-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985163840
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0952582b2d1921140c70524a3866b8e7e887ece094c2636f030a4833a83743a0
|
| 3 |
size 4985163840
|
model-00008-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985163840
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f77ff79412d4a70f2f1e7cf586726568a071da08ef76a6efafdcc1122d18e9f
|
| 3 |
size 4985163840
|
model-00009-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985163840
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9b1abf4b9a00c8eaa4654097d68cdaa73956fd2e29d05ad7f2b53f4af0e55a2
|
| 3 |
size 4985163840
|
model-00010-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985163840
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be7d3d292e378bb03ee9c35f7aaf7ed95e711e4bd76681e0920ec45bfbafe0e5
|
| 3 |
size 4985163840
|
model-00011-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985163840
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccba2f76d7ac2a8b9552f721572dc9bd21045eb1a567789cadce5da0b92bc5fa
|
| 3 |
size 4985163840
|
model-00012-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4985163840
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98e3929c8e278502b8bbd9269fcde850092d8e0de6ac1609f8496691676d842e
|
| 3 |
size 4985163840
|
model-00013-of-00013.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1246290440
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27d4c4e2ffe00b99ff9b48082fb045f520d0d59f301d6a46198b667ad17d6b8e
|
| 3 |
size 1246290440
|
spark_quantizer_provenance.json
CHANGED
|
@@ -1,11 +1,11 @@
|
|
| 1 |
{
|
| 2 |
-
"source_model": "
|
| 3 |
"quantization": "NVFP4",
|
| 4 |
"tool": "nvidia-modelopt",
|
| 5 |
"export_method": "save_pretrained_manual",
|
| 6 |
"calib_size": 512,
|
| 7 |
-
"calib_dataset": "
|
| 8 |
"hardware": "NVIDIA GB10 (Blackwell)",
|
| 9 |
-
"offload_used":
|
| 10 |
-
"elapsed_sec":
|
| 11 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"source_model": "/hf_cache/hub/models--Qwen--Qwen3-Coder-30B-A3B-Instruct/snapshots/b2cff646eb4bb1d68355c01b18ae02e7cf42d120",
|
| 3 |
"quantization": "NVFP4",
|
| 4 |
"tool": "nvidia-modelopt",
|
| 5 |
"export_method": "save_pretrained_manual",
|
| 6 |
"calib_size": 512,
|
| 7 |
+
"calib_dataset": "allenai/c4",
|
| 8 |
"hardware": "NVIDIA GB10 (Blackwell)",
|
| 9 |
+
"offload_used": false,
|
| 10 |
+
"elapsed_sec": 267
|
| 11 |
}
|
tokenizer.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
CHANGED
|
@@ -20,7 +20,7 @@
|
|
| 20 |
"<|image_pad|>",
|
| 21 |
"<|video_pad|>"
|
| 22 |
],
|
| 23 |
-
"is_local":
|
| 24 |
"model_max_length": 1048576,
|
| 25 |
"pad_token": "<|endoftext|>",
|
| 26 |
"split_special_tokens": false,
|
|
|
|
| 20 |
"<|image_pad|>",
|
| 21 |
"<|video_pad|>"
|
| 22 |
],
|
| 23 |
+
"is_local": true,
|
| 24 |
"model_max_length": 1048576,
|
| 25 |
"pad_token": "<|endoftext|>",
|
| 26 |
"split_special_tokens": false,
|