diff --git a/stablelm-base-alpha-3b-q4f16_1/mlc-chat-config.json b/stablelm-base-alpha-3b-q4f16_1/mlc-chat-config.json new file mode 100644 index 0000000000000000000000000000000000000000..fcd3efd50e62f9186cf1f3bb9e1969b7bc64d7bb --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/mlc-chat-config.json @@ -0,0 +1,16 @@ +{ + "model_lib": "stablelm-base-alpha-3b-q4f16_1", + "local_id": "stablelm-base-alpha-3b-q4f16_1", + "conv_template": "stablelm", + "temperature": 0.7, + "repetition_penalty": 1.0, + "top_p": 0.95, + "mean_gen_len": 128, + "max_gen_len": 512, + "shift_fill_factor": 0.3, + "tokenizer_files": [ + "tokenizer.model" + ], + "model_category": "gpt_neox", + "model_name": "stablelm-base-alpha-3b" +} \ No newline at end of file diff --git a/stablelm-base-alpha-3b-q4f16_1/mod_cache_before_build.pkl b/stablelm-base-alpha-3b-q4f16_1/mod_cache_before_build.pkl new file mode 100644 index 0000000000000000000000000000000000000000..d6e118c4ce7956e32f5fd53f0646fe8f1c9be767 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/mod_cache_before_build.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f733b226b425365c50eed8ab6e20360e53bffbbd4785fe71a7ee7e409542e312 +size 28616826 diff --git a/stablelm-base-alpha-3b-q4f16_1/ndarray-cache.json b/stablelm-base-alpha-3b-q4f16_1/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..ca6f5f543bcf7cf1bc7107552127341ff5f6df59 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/ndarray-cache.json @@ -0,0 +1,5762 @@ +{ + "metadata": { + "ParamSize": 486 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 78643200, + "records": [ + { + "name": "param_0", + "shape": [ + 51200, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 78643200, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_12", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_15", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 33521664, + "records": [ + { + "name": "param_1", + "shape": [ + 51200, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 9830400 + }, + { + "name": "param_3", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 9842688 + }, + { + "name": "param_4", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 9854976 + }, + { + "name": "param_5", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 9867264 + }, + { + "name": "param_6", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 9879552 + }, + { + "name": "param_7", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 24035328 + }, + { + "name": "param_8", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 25804800 + }, + { + "name": "param_9", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 25823232 + }, + { + "name": "param_10", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 30541824 + }, + { + "name": "param_11", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 31131648 + }, + { + "name": "param_13", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 31137792 + }, + { + "name": "param_14", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 33497088 + } + ] + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_28", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_31", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 28471296, + "records": [ + { + "name": "param_16", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 0 + }, + { + "name": "param_17", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 2359296 + }, + { + "name": "param_18", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 2365440 + }, + { + "name": "param_19", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 2377728 + }, + { + "name": "param_20", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 2390016 + }, + { + "name": "param_21", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 2402304 + }, + { + "name": "param_22", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 2414592 + }, + { + "name": "param_23", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 16570368 + }, + { + "name": "param_24", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 18339840 + }, + { + "name": "param_25", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 18358272 + }, + { + "name": "param_26", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 23076864 + }, + { + "name": "param_27", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 23666688 + }, + { + "name": "param_29", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23672832 + }, + { + "name": "param_30", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 26032128 + }, + { + "name": "param_32", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 26056704 + }, + { + "name": "param_33", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 28416000 + }, + { + "name": "param_34", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 28422144 + }, + { + "name": "param_35", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 28434432 + }, + { + "name": "param_36", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 28446720 + }, + { + "name": "param_37", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 28459008 + } + ] + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_44", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_47", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_38", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_39", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_40", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_41", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_42", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_43", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_45", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_46", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_48", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_49", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_50", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_51", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_52", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_53", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_60", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_63", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_54", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_55", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_56", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_57", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_58", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_59", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_61", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_62", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_64", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_65", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_66", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_67", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_68", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_69", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_76", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_79", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_70", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_71", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_72", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_73", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_74", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_75", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_77", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_78", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_80", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_81", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_82", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_83", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_84", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_85", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_92", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_95", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_86", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_87", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_88", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_89", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_90", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_91", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_93", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_94", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_96", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_97", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_98", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_99", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_100", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_101", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_108", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_111", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_102", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_103", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_104", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_105", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_106", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_107", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_109", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_110", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_112", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_113", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_114", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_115", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_116", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_117", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_124", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_127", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_118", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_119", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_120", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_121", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_122", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_123", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_125", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_126", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_128", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_129", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_130", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_131", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_132", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_133", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_140", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_143", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_134", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_135", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_136", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_137", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_138", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_139", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_141", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_142", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_144", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_145", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_146", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_147", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_148", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_149", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_156", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_159", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_150", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_151", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_152", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_153", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_154", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_155", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_157", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_158", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_160", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_161", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_162", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_163", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_164", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_165", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_172", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_175", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_166", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_167", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_168", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_169", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_170", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_171", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_173", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_174", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_176", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_177", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_178", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_179", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_180", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_181", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_188", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_191", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_182", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_183", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_184", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_185", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_186", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_187", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_189", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_190", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_192", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_193", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_194", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_195", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_196", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_197", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_204", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_207", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_198", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_199", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_200", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_201", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_202", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_203", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_205", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_206", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_208", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_209", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_210", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_211", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_212", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_213", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_220", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_223", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_214", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_215", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_216", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_217", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_218", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_219", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_221", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_222", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_224", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_225", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_226", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_227", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_228", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_229", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_236", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_239", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_230", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_231", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_232", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_233", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_234", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_235", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_237", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_238", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_240", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_241", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_242", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_243", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_244", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_245", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_252", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_255", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_246", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_247", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_248", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_249", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_250", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_251", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_253", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_254", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_256", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_257", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_258", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_259", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_260", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_261", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_268", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_271", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_262", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_263", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_264", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_265", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_266", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_267", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_269", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_270", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_272", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_273", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_274", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_275", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_276", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_277", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_284", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_287", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_278", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_279", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_280", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_281", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_282", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_283", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_285", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_286", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_288", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_289", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_290", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_291", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_292", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_293", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_300", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_303", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_294", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_295", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_296", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_297", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_298", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_299", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_301", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_302", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_304", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_305", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_306", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_307", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_308", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_309", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_316", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_319", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_310", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_311", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_312", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_313", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_314", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_315", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_317", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_318", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_320", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_321", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_322", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_323", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_324", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_325", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_332", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_335", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_326", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_327", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_328", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_329", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_330", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_331", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_333", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_334", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_336", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_337", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_338", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_339", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_340", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_341", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_348", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_351", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_342", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_343", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_344", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_345", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_346", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_347", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_349", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_350", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_352", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_353", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_354", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_355", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_356", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_357", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_364", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_367", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_358", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_359", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_360", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_361", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_362", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_363", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_365", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_366", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_368", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_369", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_370", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_371", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_372", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_373", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_380", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_383", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_374", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_375", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_376", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_377", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_378", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_379", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_381", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_382", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_384", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_385", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_386", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_387", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_388", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_389", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_396", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_399", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_390", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_391", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_392", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_393", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_394", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_395", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_397", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_398", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_400", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_401", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_402", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_403", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_404", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_405", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_412", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_415", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_406", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_407", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_408", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_409", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_410", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_411", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_413", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_414", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_416", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_417", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_418", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_419", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_420", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_421", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_428", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_431", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_422", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_423", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_424", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_425", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_426", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_427", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_429", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_430", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_432", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_433", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_434", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_435", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_436", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_437", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_444", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_447", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_438", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_439", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_440", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_441", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_442", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_443", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_445", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_446", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_448", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_449", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_450", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_451", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_452", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_453", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_460", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_463", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 26056704, + "records": [ + { + "name": "param_454", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_455", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_456", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_457", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_458", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_459", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_461", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_462", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_464", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_465", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_466", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_467", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + }, + { + "name": "param_468", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26032128 + }, + { + "name": "param_469", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26044416 + } + ] + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_476", + "shape": [ + 12288, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "param_479", + "shape": [ + 3072, + 1536 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 18874368, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 78643200, + "records": [ + { + "name": "param_484", + "shape": [ + 51200, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 78643200, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_485", + "shape": [ + 51200, + 96 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 26032128, + "records": [ + { + "name": "param_470", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 0 + }, + { + "name": "param_471", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 14155776 + }, + { + "name": "param_472", + "shape": [ + 9216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 18432, + "byteOffset": 15925248 + }, + { + "name": "param_473", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 15943680 + }, + { + "name": "param_474", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 20662272 + }, + { + "name": "param_475", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 21252096 + }, + { + "name": "param_477", + "shape": [ + 12288, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 21258240 + }, + { + "name": "param_478", + "shape": [ + 12288 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 24576, + "byteOffset": 23617536 + }, + { + "name": "param_480", + "shape": [ + 3072, + 384 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2359296, + "byteOffset": 23642112 + }, + { + "name": "param_481", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 26001408 + }, + { + "name": "param_482", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26007552 + }, + { + "name": "param_483", + "shape": [ + 3072 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 12288, + "byteOffset": 26019840 + } + ] + } + ] +} \ No newline at end of file diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_0.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef097577fa5e71b40a1380363183e5ee23fb641f --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:233c04c80bb731a2e382e236a7fb3f9fa6447d79a0d17dafe95112ad20c1c6e3 +size 78643200 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_1.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..b0d9287868ce4b8ae8bce0f4130bc86cd404b82b --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b0cd9e80f88f8445530a305c68d10221c4d541f08042a2513e38b351ab8cce2 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_10.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..3fd54b895a8aa58969b59c9e21ec0b07b973a2cd --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b575d3e64c5cd0cddaa1964010b9942cf45c7304bf357d68ff867c73fe82698d +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_11.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..666e7d0af8d8e54835ccab61c8aa6624d94ab440 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c75a82d298473985a2dcfb683f6f4a5c762fd2516cec9460f3285127a7d4ca7 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_12.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..c00880fb47d3d71f54cadcf4189e91f36abf6a54 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a90c6b84064682b2e1081ad0bfdd762c4bb5f0da18364be8afcacb22755af1a +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_13.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..347bc3b65a485f4805162983969b376ec1c948a3 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4c63a791df3b4bfdb0ebaf279a0a70ee043a6c950864f685a01cffb04d79182 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_14.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..f832e1866896fd8c24ecffc36ad4dc8177329096 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb3531219a76b56e7e38e047258f820a7f580d228d408e187f4ae7a3d2ae210c +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_15.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..e71df47bc7077c087bd80f5f28547e5762bb983b --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cfdf8e3b22414588ffe8e9ecedf6941c9f430a35da1f82e8588bd961dd3b8c2 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_16.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..a3ff5880b9424e4184edce047ec21190c12895c0 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d0ea57bdbc86c4feec71c35f39b3ddabdd9d373d5b4bfa9132a112226b025c2 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_17.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..39119d6a4992eddef2e6a69d4d372cb381a34839 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7c59daf3dc174248d7d1c347054f9b0df5efc2bfaeba80e3470512a47147ba8 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_18.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..ec8028e24d4820df6cb1128a3a7c5e35d5011760 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70cbb1650e34117c2b378dbc9af072fb25b4e3d0f7fe457b7ca282a2266af286 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_19.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..173861fbd03c073387a1214214dc47d9350f0a4e --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aedd7bbbf63a277529e8fb2ab9ef9e5bdf3fc8587a5f946b761b3af741d514e +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_2.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..68461e155fc3ae75c77de435bb53859560ff231b --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f40e97b95ee8a1b23eadea6fdd1236a5273da34a98e1d5dbd76eca25319101 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_20.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..5532f79a622f78b87861157d044c9c8e6fbe60d8 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc9864aad11befdfed7bd632ef1b5c9b26c8628e71d23539e0ae50fdd072a7a8 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_21.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..308d8df31eb82aa04dcdb6f87bd8abb6ebcec46e --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c8eadc692f2d67ad61bc44bcba5f44770c11942784a8f380f23b80350297a9e +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_22.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..fd767902accede0997a9776e067f1cb3474c7b23 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5222fcf0d0eab695f22a89c77d853b235f7c1fb8dc891fe3bda96abf2764a487 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_23.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..db4eafe3fcf551e1b3ccfd7f8556700b759c4912 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0279e9eec57ff8846b189fdd9396f750035195890e1fb0423752bb52d9f45539 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_24.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..dd19162ba1363fa883e35446cd370240cf1141ea --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7be589147d827bcf14c5bf9c2c0e94c4167915a88ce478b79383f87f3916c5 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_25.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8836ec295052b4508e66e50c8bc05a83efd1fea --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb1f8cf0917b3045d09f5dc86cee418a47e4550e36068b6cafa36bef0ca2362e +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_26.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c012c9171c50f5cc040a6a131d872e14c212827 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:325884c8ffe7e4d1106582f0e92ba3a6eae63f01344a84db4a5e97e64f2a8c89 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_27.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7fcf8a20d48e503f2b567e1cd7a7bd040366122 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d0d456c0575e1d8da407eaa4013203aa29aa62cb0e47052f198a314cea53f8 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_28.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..e66a94dd088bd97e9aa6c0c7f8addddc15554813 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00d6458a2d40e799bdad38086645f25d6f8d6505dfaa4b726bacd13bcb433e99 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_29.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..212e2fb2c30dce270722a9362e63b2e90ff3690e --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41934a78cb977e50f006915ac928cd8bd54a9118b0bbcb51d4561f3d16f2dfc4 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_3.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..da0b419b6f20c629a05390eb0609470e51db7505 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:623b7710ec072d4450d6f9c3597e255fc44523909627db0b3a5a69b850fc11c3 +size 33521664 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_30.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc41e8c5a8b4c5927952ecef270af3aa9467f055 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b32ac06f7e6fc70193fe9d4567b02367a595ce4387448ad59636e5e69036b2 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_31.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..24d5d21f05d6b0c38a55d2b9532eca4588a0516f --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c7159cd4388a16a204821c47f029c14dad3007a80d4fe9211d9234754bb0af +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_32.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..6d13a97f696b10bb5b01a3020cf7a1704545044d --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7a33f5f6e52495b4ed4a9bb920569cb0ef26aa4840ab915a096712214be9f62 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_33.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..62d973d05d81110ba290e93b97f4cd4c9e045277 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:894456d77a56cb9654fbe633349b33f52e836df20509ab4610db48f57f274135 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_34.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a5295e4884730efb629032ff34838bb294c4d3c --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7af0d155c4321af2951c7a034911cea0cbfa10a0337be5e4bb449f2473aa16 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_35.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..bf52825ebae4ca68251595b3b53c9f2f6b56abad --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eaa8ee264eaf6c2a9aa0bf9053d6371339510325f64dcb275128769cb19f91d +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_36.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..8c7360ffed391a65e5cb40dd541a749ebc44d6f8 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abf10fb29a5bcbe2eea5ce5a5e2e29d06e716421c9ee7299b795b1f1432e714c +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_37.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..0df97fbadba861c657d529099cd70a5d3063836a --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3889dc20bf19d2f053682c9d4d380e879fd429b18e1e599fea18b3e352f3bd0a +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_38.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..088fed44eada207ddd42ed2fc7ec2386c92448ac --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85a7dae55e41a79d6dfa4f27f26c5e9c9c4c5cb8b788f6e073727bed3d2a81e6 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_39.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..c953adb1865282847035aa34c225b0b0869b9e9d --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f57f24eab27f12ff4cd534b53cf5972cb7dfb6171c73ce79095aeec6e545c9d5 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_4.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..bba7ed3eccaabe3b8b8851be8f698f40268e3202 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:893672be79b5200f95f2b83242b14c10d34cf6adb1eea4f7dc6d4a154ff2ea50 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_40.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..4274be54331cae56bc254db289109aaf9766d857 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c4b8be3f41d5d813c10549f2b9a7a3a64299c7a1fc0d9c14f0e54ac20666a04 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_41.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..e1e7c8af0bdf3fd6285e78feede4c93d3d28c21d --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c6619ca65a829c472fe9ef7f279d857704597528285d2371ec7cfcd3104fecb +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_42.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..bf2129fab84f66979402ad83eda9ec40e4e23b1c --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36bf340aa196fd1dde70a54f87a63f725a3dabb5f475a82e6db3ec0002f3304f +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_43.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..469f822fe3f3916bbe8e5f1843888c8978aa7bed --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f0354b9a9e2acac436c13e84466c87930d6191c91f7ee5fc5dcbfe75fdef94c +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_44.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..ebfeb3d1c2b95435bd10a7b0b254dbd6097f5160 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b7d4682148bb60deb5e7f2d850897c572c09c336034a0bd68dd1237d0e34130 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_45.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..69ff0554706687c689dc141470ecc324c3939565 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c13c8a825a6092e7a05bae1f1378b52f5c8d003a31d1cef2e44229ba7d4ca643 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_46.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..072d3ceddb3b9476df16e091f46a2cfa38637ba8 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e4312d8b290c78bd75d56ef5c46fd642a5642e85b6967e5c87e5e3be92ed68 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_47.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..e50a9595a83a1432c1b5fce5dc9b1855071c5f1c --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4ce040a0bea111b7326464e278f973839e4b15ad8c5c8f72356769ff4b5ae32 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_48.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..53e047a69dc737f79f9ba0987a12d442b8166c41 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48e58813d2d46b5db6b725b9e49dd4275c78f35896e1d2eed4e1a8f428da6be2 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_49.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..9b833c3496a5ad28fbf5313c8dc8827edea208ad --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac5672d5a717c5bc7a3abdf645d9c7488dd20f070904574a9a45af4387943cf7 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_5.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..6d3e07e4ab5c71619c8c56a88f7d9063c580dc04 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7968b83a2584b14558ba293a27679043148295166890879b8263d488e1f927a1 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_50.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..d35b268108ed3af06ef33cef8c5d24d4348ad412 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a3fb75586ebcfd7846d1f9f6c59c0e211c728c4ee5c849a5eaa7900f626214 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_51.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..8d599bbfaf6790f5cf91468ff6f08327b4098998 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4711c4f967c6783ec50e5c5188aec1e8ec07775d79f7b2a1816e81e6cbab44a +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_52.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..84226d533b8bc6b50fd967bdd2f7d5d38ccdf2bc --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d287f2e2406e0d3f8a8a34d2d5abb607508c4dd3b6afad4e55af2d144ca20db +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_53.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..5671e18ea379cf563c9298b455e523e5129bfc5d --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a40d139f592cb452ce51448e15f297a15e774b7c66e7f9f42e0c2397597d22 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_54.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..50b939a001a87f9dc67101f8de2d5f596a2d5861 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b362434ed32a0329bf6f0b509f77dada37582d13088118508622ce68577779b3 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_55.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..0381027550c7a277aa35a20b99ca2557051fbf2c --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8466cd15a8dbc38b59e47813e0caac3344aea48394ae592e83a4687bbd676ac6 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_56.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..de2bdf2464d2d7990dc99492692ab8371b1858ce --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:890d72bd3bc9c976496a6f349bdf1cc6e56692f5d557e51074ab4680563bcfed +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_57.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..8f3eb0d56292809bbd892c0770606b47d5e6d9bf --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5b92f01536485ea34c92500b98d714c52a95e0627f757615c37b6082c735906 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_58.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..1d4f9b84a5794bb0907765c5d4b888c9c73c1a85 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f17aa96f4bac2588e53883918a8cb2196862d512b9c8390545c5f4fd55a1d35 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_59.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..6aba2b882e01c228ba78263dd0c0c2c6fd9914e9 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc40a283e7f10a47c3f4607018e6ce3477dd93ff74aea12baacaa3770b0bc21b +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_6.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..a6917448d89d330c8073cf08e7c81e481cca048b --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd14eb433e309a43596d638da0cda3ee8e0c572a9e9372ea9a5d2b338598cb2d +size 28471296 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_60.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf3b9a72521b7cdc4851147fae066f0dee6ba021 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d7b5f5b1717019a971af02648345b7441f54599ed4220724d6de5a0bc56340 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_61.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..8ca0ea9d716589a493fbf4e38e75ac24014be9b7 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a342205efa1b12d9d86bff655b64680ae02d3bc52c44e5c4f9a3d849a6d4e4a6 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_62.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..0be1446941c203dc7022ccb2bca0e00dce7e4e1e --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8979a082b566767206f7118e9264e1b5c8a705ac770a042f03f8fbf3e0e0ec33 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_63.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..4857035891120d196588d9ffcafa8d9596ccd90e --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8660c82ec74b00e908258b03d75b152c3077afd3d55cff34c277cc6d1e314f48 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_64.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..af1721db05699598222d4b1a766a5fbe4f553e68 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2906f23bedd4b664b38f446c53d5512ab9bfa9648c7252daf4b48b56f3e178f0 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_65.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..36d2a3f7c94c2bdd00e12961d28c8bc4e0974123 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abff508c24975491fa97768f553f1e6ae58db1e675061ac5dd75f32424b4b546 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_66.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..81cada79acaae1af19187f8104e76c2c6bc33415 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e28e696f6885f11028c9fae251f9e5936220a233a9b4f538d23a0aa5164930cb +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_67.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..567c5fbdf56f50c2e20673a3e076a19a550f3426 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af4dff75cab5a9c4e76ced57cd7b8c85c2ffbf6e1c1d43264e1e1c04ea0dc15 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_68.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..264d7b110f41de07bac9a5eb0262fb68a54eebde --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cb07f5e8dcf7a7c6ea455a65e06e58338633b8b96f894f0925c2ccdec2be009 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_69.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..1b9b562245f09e4e49a9b3969f730b8e74571bd5 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69880a5698105dcd4666e51ba7fe2dc6405ea5c799336a27aceb96044f0be111 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_7.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..bec6189043754a00fdfcd271998a5e4ffbf018fe --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9725ad77b33021740920024c738eb0143e0f5cbbbe8020f2aa579df8c22a6c14 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_70.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d6a21e4d1bcfb04951fb2005d34aea806bf15e1 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7efbc24b59b11972dd66cc22872ae5c6afd701faa90a746eb1f980e737acac36 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_71.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..117b837a5d696cb7c3fbdc058ec67ffc2b300145 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e878bfd6b5a894b65776dee4039f20702657a21ccecac63ad4ada00ea1ce87e5 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_72.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..a8af6a1f068f141ddca6fbb3a20405c92cc69959 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76b0c3d5dcd3aa3d8e79309c714ef58d9008b57861a5ee6193c28a0ec8a7d81d +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_73.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..7c0896d09a8742a7601a3ba01779a4969744876e --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:959b1c9126c8ce6c9e5f85e02b949ea63ace530411cbe53192e73543b4a8d430 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_74.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..5b49918e39945cec59c30b2cad7668a4906505e1 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e23d0e8cfcb46b74964a9dff0ab29ef55a4a24a9ef3b4524e22613c0f1c9526 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_75.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..c04fe7aefacbfe298cc94b9d94d06f36b0bdbe5f --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:567693a9168d6b37a1011a0813e6846684c00109f9105587d3a27f19e6d5fb21 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_76.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..7000bc2f106e8b5d5eeedb7ed0393300a9371562 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6686006c586e062bc1dcc75c3c9ae89b64ac876b5053fcf51aac15679576186 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_77.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..150b5bf7c838527212b54cfd982a1115b9f51e58 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27791b414d800b894bad144437fd294e001e8b9218dde454dccafe14a10f6d82 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_78.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..a924697a65f6b2479ec7b2774083448e71403a23 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae302dcbcae26534c186c0c391b9d525dc4ebe3b0e330b7afb9dde7e3a5f77e3 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_79.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0b0fb90738da486c1175e5e5678ffd2c348ae2b --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bf06757c9ff47071948be0ed265b7e5652e3de382833544dfc7973b02492583 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_8.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..6003729c38d8fee0c8702f5cabbe96811f8ec8ca --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af1671d8b9accba2803ee59ffdf9bd1e911f6bbfab8540870ab79c3887f3845 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_80.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..9fa5e8926cf0cc2425fad21dcefd136d46fa35cf --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9765174ca405bd78d5c2d7af4e0936ebf387586fc3bf38449792a77ffa9b8dd +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_81.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..f74ed4ea854e680a133c9447440a4f74c7430060 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a35fe8118732ca50c48f46a687edb0ea31bf69054f403b769fd68a5b3a4f4a79 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_82.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..e28da1ca0fa34f72b343dfd9e4a3eda4c89d2504 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:329c8723b90c2d8142b68b9e1689a5d2651e218c998a03bc2abde7427db8f60c +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_83.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..907c158b8bfda3bd907280733b46f53678077600 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a46f7d88cb9df65cf2092acc30e01d9654e50668f81af9d09a0eacfda4be37f1 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_84.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..21ca1f5e56109c58efb35ddf98e5be892c4a1308 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c24ef6790b1f1a0f9eb0aa667441b52745441c60ae9800d79f20bc88715d4274 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_85.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..f92e33f888aba602fd7418da27ca198513ffece0 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502291798de0163125950c6be3e34674bb1515ad280b161d09f3ead33b75b46b +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_86.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..3385c5dc16b395c1598c610db106ff413fcaf829 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:712041f60a24516ed103508c70fa547a010694de1c7ae82e54b35b6ee189a686 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_87.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..704755e26a9f3201dc0b9ab4a8a90ec8d26ce811 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebcba6d8a2776522d8a69700bb873c3b40458866f221394f1c0c3f164fb47469 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_88.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..4f8ed82724ce63b4a25b54dc4e455ae9b91ffb3f --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25a917ce56f59569126a19ee596e6cb192fcf378f5e74b28c1b236528022c321 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_89.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a88e17f0f25bd7204112b858b34ebee344001c2 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be461efe8aad2c2b04bae124bcc3f322bdc5f54e8a5669fe541ded24d2b3d0b4 +size 18874368 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_9.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ab7a00461794ee01daf45ebdfb851df455caa37 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c003dfdba9157d206d6eabf401ccdd3131586a28bab0ec2af8a36886ae472f29 +size 26056704 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_90.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c3444fd4b7b05a265cfaeefb869584e85fc5641 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1272c2cb5d36d186748cf1b731cdde5abe246aa6b6c760bb282891f0bd07cfbc +size 78643200 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_91.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..39f23b3e4d579a47a9416175279214d38807242c --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a32d3547d5d6eba99b915a3dcda012f31d28894d0f0dea64a3b1cbd3efd0311 +size 19660800 diff --git a/stablelm-base-alpha-3b-q4f16_1/params_shard_92.bin b/stablelm-base-alpha-3b-q4f16_1/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..fce7c7a6db7a6389a85009c32fc63ff78dc95d9c --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebc267cf9cc412bbe439a935a51a055e097e45b68b6a8e15b5e40a6769d327d1 +size 26032128 diff --git a/stablelm-base-alpha-3b-q4f16_1/stablelm-base-alpha-3b-q4f16_1-webgpu.wasm b/stablelm-base-alpha-3b-q4f16_1/stablelm-base-alpha-3b-q4f16_1-webgpu.wasm new file mode 100644 index 0000000000000000000000000000000000000000..15331e491aa41db7ff635a62b2475963c82a0e82 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/stablelm-base-alpha-3b-q4f16_1-webgpu.wasm @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:212059a4389a79d5c0f77a6f8d01195bf0e8d8201740c33f7ef3f4189c1baf58 +size 4632214 diff --git a/stablelm-base-alpha-3b-q4f16_1/tokenizer.model b/stablelm-base-alpha-3b-q4f16_1/tokenizer.model new file mode 100644 index 0000000000000000000000000000000000000000..0075e65bd9a8aee12f483cb0b137cca9677798d8 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/tokenizer.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c5c56a739832923347681ed8a03a9cbf5afb6d1fe60089a5b01dd2dd063ab71 +size 1208648 diff --git a/stablelm-base-alpha-3b-q4f16_1/tokenizer_config.json b/stablelm-base-alpha-3b-q4f16_1/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..65fccae84e7e60a5f1ef5d9e110cc602c65b4928 --- /dev/null +++ b/stablelm-base-alpha-3b-q4f16_1/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "add_eos_token": true, + "additional_special_tokens": null, + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "do_lower_case": false, + "eos_token": "", + "extra_ids": 0, + "keep_accents": true, + "legacy": true, + "mask_token": "", + "model_max_length": 1000000000000000019884624838656, + "pad_token": "", + "sep_token": "", + "sp_model_kwargs": {}, + "tokenizer_class": "T5Tokenizer", + "unk_token": "" +}