diff --git a/stablelm-base-alpha-3b-q4f16_1/mlc-chat-config.json b/stablelm-base-alpha-3b-q4f16_1/mlc-chat-config.json
new file mode 100644
index 0000000000000000000000000000000000000000..fcd3efd50e62f9186cf1f3bb9e1969b7bc64d7bb
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/mlc-chat-config.json
@@ -0,0 +1,16 @@
+{
+ "model_lib": "stablelm-base-alpha-3b-q4f16_1",
+ "local_id": "stablelm-base-alpha-3b-q4f16_1",
+ "conv_template": "stablelm",
+ "temperature": 0.7,
+ "repetition_penalty": 1.0,
+ "top_p": 0.95,
+ "mean_gen_len": 128,
+ "max_gen_len": 512,
+ "shift_fill_factor": 0.3,
+ "tokenizer_files": [
+ "tokenizer.model"
+ ],
+ "model_category": "gpt_neox",
+ "model_name": "stablelm-base-alpha-3b"
+}
\ No newline at end of file
diff --git a/stablelm-base-alpha-3b-q4f16_1/mod_cache_before_build.pkl b/stablelm-base-alpha-3b-q4f16_1/mod_cache_before_build.pkl
new file mode 100644
index 0000000000000000000000000000000000000000..d6e118c4ce7956e32f5fd53f0646fe8f1c9be767
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/mod_cache_before_build.pkl
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f733b226b425365c50eed8ab6e20360e53bffbbd4785fe71a7ee7e409542e312
+size 28616826
diff --git a/stablelm-base-alpha-3b-q4f16_1/ndarray-cache.json b/stablelm-base-alpha-3b-q4f16_1/ndarray-cache.json
new file mode 100644
index 0000000000000000000000000000000000000000..ca6f5f543bcf7cf1bc7107552127341ff5f6df59
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/ndarray-cache.json
@@ -0,0 +1,5762 @@
+{
+ "metadata": {
+ "ParamSize": 486
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 78643200,
+ "records": [
+ {
+ "name": "param_0",
+ "shape": [
+ 51200,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 78643200,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_12",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_15",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 33521664,
+ "records": [
+ {
+ "name": "param_1",
+ "shape": [
+ 51200,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 9830400,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_2",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 9830400
+ },
+ {
+ "name": "param_3",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 9842688
+ },
+ {
+ "name": "param_4",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 9854976
+ },
+ {
+ "name": "param_5",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 9867264
+ },
+ {
+ "name": "param_6",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 9879552
+ },
+ {
+ "name": "param_7",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 24035328
+ },
+ {
+ "name": "param_8",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 25804800
+ },
+ {
+ "name": "param_9",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 25823232
+ },
+ {
+ "name": "param_10",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 30541824
+ },
+ {
+ "name": "param_11",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 31131648
+ },
+ {
+ "name": "param_13",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 31137792
+ },
+ {
+ "name": "param_14",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 33497088
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_28",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_31",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 28471296,
+ "records": [
+ {
+ "name": "param_16",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_17",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 2359296
+ },
+ {
+ "name": "param_18",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 2365440
+ },
+ {
+ "name": "param_19",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 2377728
+ },
+ {
+ "name": "param_20",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 2390016
+ },
+ {
+ "name": "param_21",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 2402304
+ },
+ {
+ "name": "param_22",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 2414592
+ },
+ {
+ "name": "param_23",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 16570368
+ },
+ {
+ "name": "param_24",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 18339840
+ },
+ {
+ "name": "param_25",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 18358272
+ },
+ {
+ "name": "param_26",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 23076864
+ },
+ {
+ "name": "param_27",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 23666688
+ },
+ {
+ "name": "param_29",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23672832
+ },
+ {
+ "name": "param_30",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_32",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 26056704
+ },
+ {
+ "name": "param_33",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 28416000
+ },
+ {
+ "name": "param_34",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 28422144
+ },
+ {
+ "name": "param_35",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 28434432
+ },
+ {
+ "name": "param_36",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 28446720
+ },
+ {
+ "name": "param_37",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 28459008
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_44",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_47",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_38",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_39",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_40",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_41",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_42",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_43",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_45",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_46",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_48",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_49",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_50",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_51",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_52",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_53",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_60",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_63",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_54",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_55",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_56",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_57",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_58",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_59",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_61",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_62",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_64",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_65",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_66",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_67",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_68",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_69",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_76",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_79",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_70",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_71",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_72",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_73",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_74",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_75",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_77",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_78",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_80",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_81",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_82",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_83",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_84",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_85",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_92",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_95",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_86",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_87",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_88",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_89",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_90",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_91",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_93",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_94",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_96",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_97",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_98",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_99",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_100",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_101",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_108",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_111",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_102",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_103",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_104",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_105",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_106",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_107",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_109",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_110",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_112",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_113",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_114",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_115",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_116",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_117",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_124",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_127",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_118",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_119",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_120",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_121",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_122",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_123",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_125",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_126",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_128",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_129",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_130",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_131",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_132",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_133",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_140",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_143",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_134",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_135",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_136",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_137",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_138",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_139",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_141",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_142",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_144",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_145",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_146",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_147",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_148",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_149",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_156",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_159",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_150",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_151",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_152",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_153",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_154",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_155",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_157",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_158",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_160",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_161",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_162",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_163",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_164",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_165",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_172",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_175",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_166",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_167",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_168",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_169",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_170",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_171",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_173",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_174",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_176",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_177",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_178",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_179",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_180",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_181",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_188",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_191",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_182",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_183",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_184",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_185",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_186",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_187",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_189",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_190",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_192",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_193",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_194",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_195",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_196",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_197",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_204",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_207",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_198",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_199",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_200",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_201",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_202",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_203",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_205",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_206",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_208",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_209",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_210",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_211",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_212",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_213",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_220",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_223",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_214",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_215",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_216",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_217",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_218",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_219",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_221",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_222",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_224",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_225",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_226",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_227",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_228",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_229",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_236",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_239",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_230",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_231",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_232",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_233",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_234",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_235",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_237",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_238",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_240",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_241",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_242",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_243",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_244",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_245",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_252",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_255",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_246",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_247",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_248",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_249",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_250",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_251",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_253",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_254",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_256",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_257",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_258",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_259",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_260",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_261",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_268",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_271",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_262",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_263",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_264",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_265",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_266",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_267",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_269",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_270",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_272",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_273",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_274",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_275",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_276",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_277",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_284",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_287",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_278",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_279",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_280",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_281",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_282",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_283",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_285",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_286",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_288",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_289",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_290",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_291",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_292",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_293",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_300",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_303",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_294",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_295",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_296",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_297",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_298",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_299",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_301",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_302",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_304",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_305",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_306",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_307",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_308",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_309",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_316",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_319",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_310",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_311",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_312",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_313",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_314",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_315",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_317",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_318",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_320",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_321",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_322",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_323",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_324",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_325",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_332",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_335",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_326",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_327",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_328",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_329",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_330",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_331",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_333",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_334",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_336",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_337",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_338",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_339",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_340",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_341",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_348",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_351",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_342",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_343",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_344",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_345",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_346",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_347",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_349",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_350",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_352",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_353",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_354",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_355",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_356",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_357",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_364",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_367",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_358",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_359",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_360",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_361",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_362",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_363",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_365",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_366",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_368",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_369",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_370",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_371",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_372",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_373",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_380",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_383",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_374",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_375",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_376",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_377",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_378",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_379",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_381",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_382",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_384",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_385",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_386",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_387",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_388",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_389",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_396",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_399",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_390",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_391",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_392",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_393",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_394",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_395",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_397",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_398",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_400",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_401",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_402",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_403",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_404",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_405",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_412",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_415",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_406",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_407",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_408",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_409",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_410",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_411",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_413",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_414",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_416",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_417",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_418",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_419",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_420",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_421",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_428",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_431",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_422",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_423",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_424",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_425",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_426",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_427",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_429",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_430",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_432",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_433",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_434",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_435",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_436",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_437",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_444",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_447",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_438",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_439",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_440",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_441",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_442",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_443",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_445",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_446",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_448",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_449",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_450",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_451",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_452",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_453",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_460",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_463",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 26056704,
+ "records": [
+ {
+ "name": "param_454",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_455",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_456",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_457",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_458",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_459",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_461",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_462",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_464",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_465",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_466",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_467",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ },
+ {
+ "name": "param_468",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26032128
+ },
+ {
+ "name": "param_469",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26044416
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_476",
+ "shape": [
+ 12288,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 18874368,
+ "records": [
+ {
+ "name": "param_479",
+ "shape": [
+ 3072,
+ 1536
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 18874368,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 78643200,
+ "records": [
+ {
+ "name": "param_484",
+ "shape": [
+ 51200,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 78643200,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_485",
+ "shape": [
+ 51200,
+ 96
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 26032128,
+ "records": [
+ {
+ "name": "param_470",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_471",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 14155776
+ },
+ {
+ "name": "param_472",
+ "shape": [
+ 9216
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 18432,
+ "byteOffset": 15925248
+ },
+ {
+ "name": "param_473",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 15943680
+ },
+ {
+ "name": "param_474",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 20662272
+ },
+ {
+ "name": "param_475",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 21252096
+ },
+ {
+ "name": "param_477",
+ "shape": [
+ 12288,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 21258240
+ },
+ {
+ "name": "param_478",
+ "shape": [
+ 12288
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 24576,
+ "byteOffset": 23617536
+ },
+ {
+ "name": "param_480",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2359296,
+ "byteOffset": 23642112
+ },
+ {
+ "name": "param_481",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 26001408
+ },
+ {
+ "name": "param_482",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26007552
+ },
+ {
+ "name": "param_483",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float32",
+ "format": "raw",
+ "nbytes": 12288,
+ "byteOffset": 26019840
+ }
+ ]
+ }
+ ]
+}
\ No newline at end of file
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_0.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_0.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ef097577fa5e71b40a1380363183e5ee23fb641f
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:233c04c80bb731a2e382e236a7fb3f9fa6447d79a0d17dafe95112ad20c1c6e3
+size 78643200
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_1.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_1.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b0d9287868ce4b8ae8bce0f4130bc86cd404b82b
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_1.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7b0cd9e80f88f8445530a305c68d10221c4d541f08042a2513e38b351ab8cce2
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_10.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_10.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3fd54b895a8aa58969b59c9e21ec0b07b973a2cd
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_10.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b575d3e64c5cd0cddaa1964010b9942cf45c7304bf357d68ff867c73fe82698d
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_11.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_11.bin
new file mode 100644
index 0000000000000000000000000000000000000000..666e7d0af8d8e54835ccab61c8aa6624d94ab440
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_11.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c75a82d298473985a2dcfb683f6f4a5c762fd2516cec9460f3285127a7d4ca7
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_12.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_12.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c00880fb47d3d71f54cadcf4189e91f36abf6a54
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_12.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3a90c6b84064682b2e1081ad0bfdd762c4bb5f0da18364be8afcacb22755af1a
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_13.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_13.bin
new file mode 100644
index 0000000000000000000000000000000000000000..347bc3b65a485f4805162983969b376ec1c948a3
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_13.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b4c63a791df3b4bfdb0ebaf279a0a70ee043a6c950864f685a01cffb04d79182
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_14.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_14.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f832e1866896fd8c24ecffc36ad4dc8177329096
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_14.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb3531219a76b56e7e38e047258f820a7f580d228d408e187f4ae7a3d2ae210c
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_15.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_15.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e71df47bc7077c087bd80f5f28547e5762bb983b
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_15.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2cfdf8e3b22414588ffe8e9ecedf6941c9f430a35da1f82e8588bd961dd3b8c2
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_16.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_16.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a3ff5880b9424e4184edce047ec21190c12895c0
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_16.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d0ea57bdbc86c4feec71c35f39b3ddabdd9d373d5b4bfa9132a112226b025c2
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_17.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_17.bin
new file mode 100644
index 0000000000000000000000000000000000000000..39119d6a4992eddef2e6a69d4d372cb381a34839
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_17.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d7c59daf3dc174248d7d1c347054f9b0df5efc2bfaeba80e3470512a47147ba8
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_18.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_18.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ec8028e24d4820df6cb1128a3a7c5e35d5011760
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_18.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:70cbb1650e34117c2b378dbc9af072fb25b4e3d0f7fe457b7ca282a2266af286
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_19.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_19.bin
new file mode 100644
index 0000000000000000000000000000000000000000..173861fbd03c073387a1214214dc47d9350f0a4e
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_19.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8aedd7bbbf63a277529e8fb2ab9ef9e5bdf3fc8587a5f946b761b3af741d514e
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_2.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_2.bin
new file mode 100644
index 0000000000000000000000000000000000000000..68461e155fc3ae75c77de435bb53859560ff231b
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_2.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41f40e97b95ee8a1b23eadea6fdd1236a5273da34a98e1d5dbd76eca25319101
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_20.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_20.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5532f79a622f78b87861157d044c9c8e6fbe60d8
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_20.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dc9864aad11befdfed7bd632ef1b5c9b26c8628e71d23539e0ae50fdd072a7a8
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_21.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_21.bin
new file mode 100644
index 0000000000000000000000000000000000000000..308d8df31eb82aa04dcdb6f87bd8abb6ebcec46e
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_21.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c8eadc692f2d67ad61bc44bcba5f44770c11942784a8f380f23b80350297a9e
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_22.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_22.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fd767902accede0997a9776e067f1cb3474c7b23
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_22.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5222fcf0d0eab695f22a89c77d853b235f7c1fb8dc891fe3bda96abf2764a487
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_23.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_23.bin
new file mode 100644
index 0000000000000000000000000000000000000000..db4eafe3fcf551e1b3ccfd7f8556700b759c4912
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_23.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0279e9eec57ff8846b189fdd9396f750035195890e1fb0423752bb52d9f45539
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_24.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_24.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dd19162ba1363fa883e35446cd370240cf1141ea
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_24.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a7be589147d827bcf14c5bf9c2c0e94c4167915a88ce478b79383f87f3916c5
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_25.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_25.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b8836ec295052b4508e66e50c8bc05a83efd1fea
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_25.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb1f8cf0917b3045d09f5dc86cee418a47e4550e36068b6cafa36bef0ca2362e
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_26.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_26.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6c012c9171c50f5cc040a6a131d872e14c212827
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_26.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:325884c8ffe7e4d1106582f0e92ba3a6eae63f01344a84db4a5e97e64f2a8c89
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_27.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_27.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e7fcf8a20d48e503f2b567e1cd7a7bd040366122
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_27.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:54d0d456c0575e1d8da407eaa4013203aa29aa62cb0e47052f198a314cea53f8
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_28.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_28.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e66a94dd088bd97e9aa6c0c7f8addddc15554813
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_28.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:00d6458a2d40e799bdad38086645f25d6f8d6505dfaa4b726bacd13bcb433e99
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_29.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_29.bin
new file mode 100644
index 0000000000000000000000000000000000000000..212e2fb2c30dce270722a9362e63b2e90ff3690e
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_29.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41934a78cb977e50f006915ac928cd8bd54a9118b0bbcb51d4561f3d16f2dfc4
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_3.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_3.bin
new file mode 100644
index 0000000000000000000000000000000000000000..da0b419b6f20c629a05390eb0609470e51db7505
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_3.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:623b7710ec072d4450d6f9c3597e255fc44523909627db0b3a5a69b850fc11c3
+size 33521664
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_30.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_30.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cc41e8c5a8b4c5927952ecef270af3aa9467f055
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_30.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4b32ac06f7e6fc70193fe9d4567b02367a595ce4387448ad59636e5e69036b2
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_31.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_31.bin
new file mode 100644
index 0000000000000000000000000000000000000000..24d5d21f05d6b0c38a55d2b9532eca4588a0516f
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_31.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b0c7159cd4388a16a204821c47f029c14dad3007a80d4fe9211d9234754bb0af
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_32.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_32.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6d13a97f696b10bb5b01a3020cf7a1704545044d
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_32.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b7a33f5f6e52495b4ed4a9bb920569cb0ef26aa4840ab915a096712214be9f62
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_33.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_33.bin
new file mode 100644
index 0000000000000000000000000000000000000000..62d973d05d81110ba290e93b97f4cd4c9e045277
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_33.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:894456d77a56cb9654fbe633349b33f52e836df20509ab4610db48f57f274135
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_34.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_34.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6a5295e4884730efb629032ff34838bb294c4d3c
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_34.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da7af0d155c4321af2951c7a034911cea0cbfa10a0337be5e4bb449f2473aa16
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_35.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_35.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bf52825ebae4ca68251595b3b53c9f2f6b56abad
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_35.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4eaa8ee264eaf6c2a9aa0bf9053d6371339510325f64dcb275128769cb19f91d
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_36.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_36.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8c7360ffed391a65e5cb40dd541a749ebc44d6f8
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_36.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:abf10fb29a5bcbe2eea5ce5a5e2e29d06e716421c9ee7299b795b1f1432e714c
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_37.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_37.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0df97fbadba861c657d529099cd70a5d3063836a
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_37.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3889dc20bf19d2f053682c9d4d380e879fd429b18e1e599fea18b3e352f3bd0a
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_38.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_38.bin
new file mode 100644
index 0000000000000000000000000000000000000000..088fed44eada207ddd42ed2fc7ec2386c92448ac
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_38.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:85a7dae55e41a79d6dfa4f27f26c5e9c9c4c5cb8b788f6e073727bed3d2a81e6
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_39.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_39.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c953adb1865282847035aa34c225b0b0869b9e9d
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_39.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f57f24eab27f12ff4cd534b53cf5972cb7dfb6171c73ce79095aeec6e545c9d5
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_4.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_4.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bba7ed3eccaabe3b8b8851be8f698f40268e3202
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_4.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:893672be79b5200f95f2b83242b14c10d34cf6adb1eea4f7dc6d4a154ff2ea50
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_40.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_40.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4274be54331cae56bc254db289109aaf9766d857
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_40.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8c4b8be3f41d5d813c10549f2b9a7a3a64299c7a1fc0d9c14f0e54ac20666a04
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_41.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_41.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e1e7c8af0bdf3fd6285e78feede4c93d3d28c21d
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_41.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8c6619ca65a829c472fe9ef7f279d857704597528285d2371ec7cfcd3104fecb
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_42.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_42.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bf2129fab84f66979402ad83eda9ec40e4e23b1c
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_42.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:36bf340aa196fd1dde70a54f87a63f725a3dabb5f475a82e6db3ec0002f3304f
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_43.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_43.bin
new file mode 100644
index 0000000000000000000000000000000000000000..469f822fe3f3916bbe8e5f1843888c8978aa7bed
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_43.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2f0354b9a9e2acac436c13e84466c87930d6191c91f7ee5fc5dcbfe75fdef94c
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_44.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_44.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ebfeb3d1c2b95435bd10a7b0b254dbd6097f5160
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_44.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0b7d4682148bb60deb5e7f2d850897c572c09c336034a0bd68dd1237d0e34130
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_45.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_45.bin
new file mode 100644
index 0000000000000000000000000000000000000000..69ff0554706687c689dc141470ecc324c3939565
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_45.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c13c8a825a6092e7a05bae1f1378b52f5c8d003a31d1cef2e44229ba7d4ca643
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_46.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_46.bin
new file mode 100644
index 0000000000000000000000000000000000000000..072d3ceddb3b9476df16e091f46a2cfa38637ba8
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_46.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f3e4312d8b290c78bd75d56ef5c46fd642a5642e85b6967e5c87e5e3be92ed68
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_47.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_47.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e50a9595a83a1432c1b5fce5dc9b1855071c5f1c
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_47.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b4ce040a0bea111b7326464e278f973839e4b15ad8c5c8f72356769ff4b5ae32
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_48.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_48.bin
new file mode 100644
index 0000000000000000000000000000000000000000..53e047a69dc737f79f9ba0987a12d442b8166c41
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_48.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:48e58813d2d46b5db6b725b9e49dd4275c78f35896e1d2eed4e1a8f428da6be2
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_49.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_49.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9b833c3496a5ad28fbf5313c8dc8827edea208ad
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_49.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ac5672d5a717c5bc7a3abdf645d9c7488dd20f070904574a9a45af4387943cf7
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_5.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_5.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6d3e07e4ab5c71619c8c56a88f7d9063c580dc04
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_5.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7968b83a2584b14558ba293a27679043148295166890879b8263d488e1f927a1
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_50.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_50.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d35b268108ed3af06ef33cef8c5d24d4348ad412
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_50.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:39a3fb75586ebcfd7846d1f9f6c59c0e211c728c4ee5c849a5eaa7900f626214
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_51.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_51.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8d599bbfaf6790f5cf91468ff6f08327b4098998
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_51.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b4711c4f967c6783ec50e5c5188aec1e8ec07775d79f7b2a1816e81e6cbab44a
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_52.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_52.bin
new file mode 100644
index 0000000000000000000000000000000000000000..84226d533b8bc6b50fd967bdd2f7d5d38ccdf2bc
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_52.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5d287f2e2406e0d3f8a8a34d2d5abb607508c4dd3b6afad4e55af2d144ca20db
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_53.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_53.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5671e18ea379cf563c9298b455e523e5129bfc5d
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_53.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c5a40d139f592cb452ce51448e15f297a15e774b7c66e7f9f42e0c2397597d22
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_54.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_54.bin
new file mode 100644
index 0000000000000000000000000000000000000000..50b939a001a87f9dc67101f8de2d5f596a2d5861
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_54.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b362434ed32a0329bf6f0b509f77dada37582d13088118508622ce68577779b3
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_55.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_55.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0381027550c7a277aa35a20b99ca2557051fbf2c
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_55.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8466cd15a8dbc38b59e47813e0caac3344aea48394ae592e83a4687bbd676ac6
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_56.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_56.bin
new file mode 100644
index 0000000000000000000000000000000000000000..de2bdf2464d2d7990dc99492692ab8371b1858ce
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_56.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:890d72bd3bc9c976496a6f349bdf1cc6e56692f5d557e51074ab4680563bcfed
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_57.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_57.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8f3eb0d56292809bbd892c0770606b47d5e6d9bf
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_57.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a5b92f01536485ea34c92500b98d714c52a95e0627f757615c37b6082c735906
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_58.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_58.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1d4f9b84a5794bb0907765c5d4b888c9c73c1a85
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_58.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1f17aa96f4bac2588e53883918a8cb2196862d512b9c8390545c5f4fd55a1d35
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_59.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_59.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6aba2b882e01c228ba78263dd0c0c2c6fd9914e9
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_59.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dc40a283e7f10a47c3f4607018e6ce3477dd93ff74aea12baacaa3770b0bc21b
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_6.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_6.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a6917448d89d330c8073cf08e7c81e481cca048b
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_6.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bd14eb433e309a43596d638da0cda3ee8e0c572a9e9372ea9a5d2b338598cb2d
+size 28471296
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_60.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_60.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cf3b9a72521b7cdc4851147fae066f0dee6ba021
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_60.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:02d7b5f5b1717019a971af02648345b7441f54599ed4220724d6de5a0bc56340
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_61.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_61.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8ca0ea9d716589a493fbf4e38e75ac24014be9b7
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_61.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a342205efa1b12d9d86bff655b64680ae02d3bc52c44e5c4f9a3d849a6d4e4a6
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_62.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_62.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0be1446941c203dc7022ccb2bca0e00dce7e4e1e
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_62.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8979a082b566767206f7118e9264e1b5c8a705ac770a042f03f8fbf3e0e0ec33
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_63.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_63.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4857035891120d196588d9ffcafa8d9596ccd90e
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_63.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8660c82ec74b00e908258b03d75b152c3077afd3d55cff34c277cc6d1e314f48
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_64.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_64.bin
new file mode 100644
index 0000000000000000000000000000000000000000..af1721db05699598222d4b1a766a5fbe4f553e68
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_64.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2906f23bedd4b664b38f446c53d5512ab9bfa9648c7252daf4b48b56f3e178f0
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_65.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_65.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36d2a3f7c94c2bdd00e12961d28c8bc4e0974123
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_65.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:abff508c24975491fa97768f553f1e6ae58db1e675061ac5dd75f32424b4b546
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_66.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_66.bin
new file mode 100644
index 0000000000000000000000000000000000000000..81cada79acaae1af19187f8104e76c2c6bc33415
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_66.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e28e696f6885f11028c9fae251f9e5936220a233a9b4f538d23a0aa5164930cb
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_67.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_67.bin
new file mode 100644
index 0000000000000000000000000000000000000000..567c5fbdf56f50c2e20673a3e076a19a550f3426
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_67.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6af4dff75cab5a9c4e76ced57cd7b8c85c2ffbf6e1c1d43264e1e1c04ea0dc15
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_68.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_68.bin
new file mode 100644
index 0000000000000000000000000000000000000000..264d7b110f41de07bac9a5eb0262fb68a54eebde
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_68.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4cb07f5e8dcf7a7c6ea455a65e06e58338633b8b96f894f0925c2ccdec2be009
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_69.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_69.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b9b562245f09e4e49a9b3969f730b8e74571bd5
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_69.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69880a5698105dcd4666e51ba7fe2dc6405ea5c799336a27aceb96044f0be111
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_7.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_7.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bec6189043754a00fdfcd271998a5e4ffbf018fe
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_7.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9725ad77b33021740920024c738eb0143e0f5cbbbe8020f2aa579df8c22a6c14
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_70.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_70.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9d6a21e4d1bcfb04951fb2005d34aea806bf15e1
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_70.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7efbc24b59b11972dd66cc22872ae5c6afd701faa90a746eb1f980e737acac36
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_71.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_71.bin
new file mode 100644
index 0000000000000000000000000000000000000000..117b837a5d696cb7c3fbdc058ec67ffc2b300145
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_71.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e878bfd6b5a894b65776dee4039f20702657a21ccecac63ad4ada00ea1ce87e5
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_72.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_72.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a8af6a1f068f141ddca6fbb3a20405c92cc69959
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_72.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:76b0c3d5dcd3aa3d8e79309c714ef58d9008b57861a5ee6193c28a0ec8a7d81d
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_73.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_73.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7c0896d09a8742a7601a3ba01779a4969744876e
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_73.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:959b1c9126c8ce6c9e5f85e02b949ea63ace530411cbe53192e73543b4a8d430
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_74.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_74.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5b49918e39945cec59c30b2cad7668a4906505e1
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_74.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4e23d0e8cfcb46b74964a9dff0ab29ef55a4a24a9ef3b4524e22613c0f1c9526
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_75.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_75.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c04fe7aefacbfe298cc94b9d94d06f36b0bdbe5f
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_75.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:567693a9168d6b37a1011a0813e6846684c00109f9105587d3a27f19e6d5fb21
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_76.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_76.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7000bc2f106e8b5d5eeedb7ed0393300a9371562
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_76.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6686006c586e062bc1dcc75c3c9ae89b64ac876b5053fcf51aac15679576186
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_77.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_77.bin
new file mode 100644
index 0000000000000000000000000000000000000000..150b5bf7c838527212b54cfd982a1115b9f51e58
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_77.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:27791b414d800b894bad144437fd294e001e8b9218dde454dccafe14a10f6d82
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_78.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_78.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a924697a65f6b2479ec7b2774083448e71403a23
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_78.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae302dcbcae26534c186c0c391b9d525dc4ebe3b0e330b7afb9dde7e3a5f77e3
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_79.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_79.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d0b0fb90738da486c1175e5e5678ffd2c348ae2b
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_79.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6bf06757c9ff47071948be0ed265b7e5652e3de382833544dfc7973b02492583
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_8.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_8.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6003729c38d8fee0c8702f5cabbe96811f8ec8ca
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_8.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9af1671d8b9accba2803ee59ffdf9bd1e911f6bbfab8540870ab79c3887f3845
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_80.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_80.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9fa5e8926cf0cc2425fad21dcefd136d46fa35cf
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_80.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d9765174ca405bd78d5c2d7af4e0936ebf387586fc3bf38449792a77ffa9b8dd
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_81.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_81.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f74ed4ea854e680a133c9447440a4f74c7430060
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_81.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a35fe8118732ca50c48f46a687edb0ea31bf69054f403b769fd68a5b3a4f4a79
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_82.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_82.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e28da1ca0fa34f72b343dfd9e4a3eda4c89d2504
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_82.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:329c8723b90c2d8142b68b9e1689a5d2651e218c998a03bc2abde7427db8f60c
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_83.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_83.bin
new file mode 100644
index 0000000000000000000000000000000000000000..907c158b8bfda3bd907280733b46f53678077600
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_83.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a46f7d88cb9df65cf2092acc30e01d9654e50668f81af9d09a0eacfda4be37f1
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_84.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_84.bin
new file mode 100644
index 0000000000000000000000000000000000000000..21ca1f5e56109c58efb35ddf98e5be892c4a1308
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_84.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c24ef6790b1f1a0f9eb0aa667441b52745441c60ae9800d79f20bc88715d4274
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_85.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_85.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f92e33f888aba602fd7418da27ca198513ffece0
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_85.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:502291798de0163125950c6be3e34674bb1515ad280b161d09f3ead33b75b46b
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_86.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_86.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3385c5dc16b395c1598c610db106ff413fcaf829
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_86.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:712041f60a24516ed103508c70fa547a010694de1c7ae82e54b35b6ee189a686
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_87.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_87.bin
new file mode 100644
index 0000000000000000000000000000000000000000..704755e26a9f3201dc0b9ab4a8a90ec8d26ce811
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_87.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ebcba6d8a2776522d8a69700bb873c3b40458866f221394f1c0c3f164fb47469
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_88.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_88.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4f8ed82724ce63b4a25b54dc4e455ae9b91ffb3f
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_88.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:25a917ce56f59569126a19ee596e6cb192fcf378f5e74b28c1b236528022c321
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_89.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_89.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4a88e17f0f25bd7204112b858b34ebee344001c2
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_89.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be461efe8aad2c2b04bae124bcc3f322bdc5f54e8a5669fe541ded24d2b3d0b4
+size 18874368
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_9.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_9.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2ab7a00461794ee01daf45ebdfb851df455caa37
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_9.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c003dfdba9157d206d6eabf401ccdd3131586a28bab0ec2af8a36886ae472f29
+size 26056704
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_90.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_90.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2c3444fd4b7b05a265cfaeefb869584e85fc5641
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_90.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1272c2cb5d36d186748cf1b731cdde5abe246aa6b6c760bb282891f0bd07cfbc
+size 78643200
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_91.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_91.bin
new file mode 100644
index 0000000000000000000000000000000000000000..39f23b3e4d579a47a9416175279214d38807242c
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_91.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3a32d3547d5d6eba99b915a3dcda012f31d28894d0f0dea64a3b1cbd3efd0311
+size 19660800
diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_92.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_92.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fce7c7a6db7a6389a85009c32fc63ff78dc95d9c
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_92.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ebc267cf9cc412bbe439a935a51a055e097e45b68b6a8e15b5e40a6769d327d1
+size 26032128
diff --git a/stablelm-base-alpha-3b-q4f16_1/stablelm-base-alpha-3b-q4f16_1-webgpu.wasm b/stablelm-base-alpha-3b-q4f16_1/stablelm-base-alpha-3b-q4f16_1-webgpu.wasm
new file mode 100644
index 0000000000000000000000000000000000000000..15331e491aa41db7ff635a62b2475963c82a0e82
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/stablelm-base-alpha-3b-q4f16_1-webgpu.wasm
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:212059a4389a79d5c0f77a6f8d01195bf0e8d8201740c33f7ef3f4189c1baf58
+size 4632214
diff --git a/stablelm-base-alpha-3b-q4f16_1/tokenizer.model b/stablelm-base-alpha-3b-q4f16_1/tokenizer.model
new file mode 100644
index 0000000000000000000000000000000000000000..0075e65bd9a8aee12f483cb0b137cca9677798d8
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/tokenizer.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0c5c56a739832923347681ed8a03a9cbf5afb6d1fe60089a5b01dd2dd063ab71
+size 1208648
diff --git a/stablelm-base-alpha-3b-q4f16_1/tokenizer_config.json b/stablelm-base-alpha-3b-q4f16_1/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..65fccae84e7e60a5f1ef5d9e110cc602c65b4928
--- /dev/null
+++ b/stablelm-base-alpha-3b-q4f16_1/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "add_eos_token": true,
+ "additional_special_tokens": null,
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "do_lower_case": false,
+ "eos_token": "",
+ "extra_ids": 0,
+ "keep_accents": true,
+ "legacy": true,
+ "mask_token": "",
+ "model_max_length": 1000000000000000019884624838656,
+ "pad_token": "",
+ "sep_token": "",
+ "sp_model_kwargs": {},
+ "tokenizer_class": "T5Tokenizer",
+ "unk_token": ""
+}