diff --git "a/ndarray-cache.json" "b/ndarray-cache.json" new file mode 100644--- /dev/null +++ "b/ndarray-cache.json" @@ -0,0 +1,5855 @@ +{ + "metadata": { + "ParamSize": 518 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 64552960, + "records": [ + { + "name": "param_0", + "shape": [ + 50432, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 64552960, + "byteOffset": 0 + } + ], + "md5sum": "01055e9fb1f7549b971a33d04611c34a" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 22876160, + "records": [ + { + "name": "param_1", + "shape": [ + 50432, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8069120, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 8069120 + }, + { + "name": "param_3", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 8079360 + }, + { + "name": "param_4", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 8089600 + }, + { + "name": "param_5", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 8099840 + }, + { + "name": "param_6", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 8110080 + }, + { + "name": "param_7", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 17940480 + }, + { + "name": "param_8", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 19169280 + }, + { + "name": "param_9", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 19184640 + }, + { + "name": "param_10", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 22461440 + }, + { + "name": "param_11", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 22871040 + } + ], + "md5sum": "7701496333979e8d77f274384d74e755" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_12", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_13", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_14", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_15", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_16", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_17", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_18", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_19", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_20", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_21", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "fb3d87b1e31e82f633c4d47bc0db0f72" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_22", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_23", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_24", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_25", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_26", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_27", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_28", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_29", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_30", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "45dc53d6231c6da77291bd6c3e549f45" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_31", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_32", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_33", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_34", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_35", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_36", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_37", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_38", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_39", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_40", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_41", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_42", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_43", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "37bd90ec38c3480245f929bceca2c861" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_44", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_45", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_46", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_47", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_48", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_49", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_50", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_51", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_52", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_53", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "49d45db0135273ae9b80e34fc2546e53" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_54", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_55", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_56", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_57", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_58", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_59", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_60", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_61", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_62", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "4ee34d0f74bea846c24397b4c5cd5e0f" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_63", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_64", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_65", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_66", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_67", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_68", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_69", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_70", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_71", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_72", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_73", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_74", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_75", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "b056fb0c3b5550ff3be4203f1c680772" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_76", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_77", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_78", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_79", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_80", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_81", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_82", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_83", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_84", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_85", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "a4e1746a777be6c1f3b526c0317435df" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_86", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_87", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_88", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_89", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_90", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_91", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_92", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_93", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_94", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "f0b0544635edefea7e91df7b1f7652d7" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_95", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_96", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_97", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_98", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_99", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_100", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_101", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_102", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_103", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_104", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_105", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_106", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_107", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "289e2f3af5b32bf6402ff56b55b727e1" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_108", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_109", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_110", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_111", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_112", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_113", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_114", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_115", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_116", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_117", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "81ce8227fb8c9a4c9adbd97f1f79c9c3" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_118", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_119", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_120", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_121", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_122", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_123", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_124", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_125", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_126", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "8c8fdb947265699eec076da763f8ad54" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_127", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_128", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_129", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_130", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_131", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_132", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_133", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_134", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_135", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_136", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_137", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_138", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_139", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "b3207d6bbdf067e9834b67868e23cd7e" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_140", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_141", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_142", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_143", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_144", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_145", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_146", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_147", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_148", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_149", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "edd181aafc7c04de14f6ae77a12b309c" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_150", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_151", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_152", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_153", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_154", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_155", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_156", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_157", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_158", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "54bf96834dd8e736c33dd98bdb7ff0de" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_159", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_160", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_161", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_162", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_163", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_164", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_165", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_166", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_167", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_168", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_169", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_170", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_171", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "6486da297ff945ffc439a4a1211abab6" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_172", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_173", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_174", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_175", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_176", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_177", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_178", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_179", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_180", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_181", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "106d0e65924dd417a3321763b6fb3b22" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_182", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_183", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_184", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_185", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_186", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_187", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_188", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_189", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_190", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "433e5934034a653cac6568a49845e2dc" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_191", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_192", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_193", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_194", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_195", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_196", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_197", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_198", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_199", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_200", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_201", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_202", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_203", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "b7aef16b0ccd66340ea525ae5efdd357" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_204", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_205", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_206", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_207", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_208", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_209", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_210", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_211", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_212", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_213", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "86cfcca6ed0fae450e6f51a3e39ada62" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_214", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_215", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_216", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_217", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_218", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_219", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_220", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_221", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_222", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "0d04df4e75fa8a93b302ee1fa39c9f45" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_223", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_224", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_225", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_226", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_227", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_228", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_229", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_230", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_231", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_232", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_233", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_234", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_235", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "348bd2342f3fdc86076e4f708ed8850c" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_236", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_237", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_238", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_239", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_240", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_241", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_242", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_243", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_244", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_245", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "88072a52129821885f77520b90e6d1cd" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_246", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_247", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_248", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_249", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_250", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_251", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_252", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_253", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_254", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "18a80f2c3bc21814b8eaadc8fbcac53f" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_255", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_256", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_257", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_258", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_259", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_260", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_261", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_262", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_263", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_264", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_265", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_266", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_267", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "c4847a9b00433619a9037d5628e09bad" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_268", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_269", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_270", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_271", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_272", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_273", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_274", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_275", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_276", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_277", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "fbbaaad1fc7a0005ef4ea78ef6e654b4" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_278", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_279", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_280", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_281", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_282", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_283", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_284", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_285", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_286", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "8e3a44396334ed65c5561aec24b7acb6" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_287", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_288", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_289", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_290", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_291", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_292", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_293", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_294", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_295", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_296", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_297", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_298", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_299", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "07029b3490a9e8d9a4fed7284d9f332e" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_300", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_301", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_302", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_303", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_304", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_305", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_306", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_307", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_308", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_309", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "8c299a77cd991862741f406c94c9e86c" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_310", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_311", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_312", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_313", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_314", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_315", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_316", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_317", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_318", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "05e896400a53fb02b46af36da40a75ba" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_319", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_320", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_321", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_322", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_323", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_324", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_325", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_326", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_327", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_328", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_329", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_330", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_331", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "df0cfcfb00232047a2af5244fae1df11" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_332", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_333", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_334", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_335", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_336", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_337", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_338", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_339", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_340", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_341", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "3a278a1ce1d4ba52b0ca38574f5fa28a" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_342", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_343", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_344", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_345", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_346", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_347", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_348", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_349", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_350", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "7331c4a7f616de94afa52dd1d9dba3a8" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_351", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_352", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_353", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_354", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_355", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_356", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_357", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_358", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_359", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_360", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_361", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_362", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_363", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "0b842d0db88df50c54e366231bfeb82b" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_364", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_365", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_366", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_367", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_368", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_369", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_370", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_371", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_372", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_373", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "6df85891caac5bf650a2075a37160328" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_374", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_375", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_376", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_377", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_378", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_379", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_380", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_381", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_382", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "26a7cbf49187ad776fe59226febc7fb7" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_383", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_384", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_385", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_386", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_387", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_388", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_389", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_390", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_391", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_392", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_393", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_394", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_395", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "c7bd7f983cd89008ff240757d2679568" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_396", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_397", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_398", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_399", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_400", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_401", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_402", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_403", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_404", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_405", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "195f549f1b25a347a471840345a05ec9" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_406", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_407", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_408", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_409", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_410", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_411", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_412", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_413", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_414", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "3107f769cae2eb2b7289656f51586399" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_415", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_416", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_417", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_418", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_419", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_420", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_421", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_422", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_423", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_424", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_425", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_426", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_427", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "96d4ecde627142edfd8c2dfc4f593a12" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_428", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_429", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_430", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_431", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_432", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_433", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_434", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_435", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_436", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_437", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "a347014c6fbd8443474aad967df11394" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_438", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_439", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_440", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_441", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_442", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_443", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_444", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_445", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_446", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "1e9138f272d90f33fd520ccf94f7f861" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_447", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_448", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_449", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_450", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_451", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_452", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_453", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_454", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_455", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_456", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_457", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_458", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_459", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "357c94342de47d2fec5f35a279cfca36" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_460", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_461", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_462", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_463", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_464", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_465", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_466", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_467", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_468", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_469", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "e9751d9f29c1f42d0d02017cc39d82f3" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_470", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_471", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_472", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_473", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_474", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_475", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_476", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_477", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_478", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "4420c4c1a2dfa55ae5e490a6825d9a99" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 29562880, + "records": [ + { + "name": "param_479", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_480", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_481", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_482", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_483", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_484", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14776320 + }, + { + "name": "param_485", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14786560 + }, + { + "name": "param_486", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 14796800 + }, + { + "name": "param_487", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24627200 + }, + { + "name": "param_488", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 25856000 + }, + { + "name": "param_489", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 25871360 + }, + { + "name": "param_490", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29148160 + }, + { + "name": "param_491", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 29557760 + } + ], + "md5sum": "2e8a6d21771e160ec336ff0b69e5632d" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 29583360, + "records": [ + { + "name": "param_492", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_493", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_494", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 14745600 + }, + { + "name": "param_495", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14786560 + }, + { + "name": "param_496", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27893760 + }, + { + "name": "param_497", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29532160 + }, + { + "name": "param_498", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29542400 + }, + { + "name": "param_499", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29552640 + }, + { + "name": "param_500", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29562880 + }, + { + "name": "param_501", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 29573120 + } + ], + "md5sum": "1df3255e7718b38e107083130c61150c" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 29552640, + "records": [ + { + "name": "param_502", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_503", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_504", + "shape": [ + 7680 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 15360, + "byteOffset": 11059200 + }, + { + "name": "param_505", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11074560 + }, + { + "name": "param_506", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14351360 + }, + { + "name": "param_507", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 14760960 + }, + { + "name": "param_508", + "shape": [ + 10240, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 14766080 + }, + { + "name": "param_509", + "shape": [ + 10240, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 27873280 + }, + { + "name": "param_510", + "shape": [ + 10240 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 40960, + "byteOffset": 29511680 + } + ], + "md5sum": "2ddb0502a5521fa34bb2d077ed0b065b" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 64552960, + "records": [ + { + "name": "param_516", + "shape": [ + 50432, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 64552960, + "byteOffset": 0 + } + ], + "md5sum": "25ea3e71fa498e95a5f1849d36ab9f50" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 30914560, + "records": [ + { + "name": "param_511", + "shape": [ + 2560, + 1280 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_512", + "shape": [ + 2560, + 320 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1638400, + "byteOffset": 13107200 + }, + { + "name": "param_513", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14745600 + }, + { + "name": "param_514", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14755840 + }, + { + "name": "param_515", + "shape": [ + 2560 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 10240, + "byteOffset": 14766080 + }, + { + "name": "param_517", + "shape": [ + 50432, + 80 + ], + "dtype": "float32", + "format": "raw", + "nbytes": 16138240, + "byteOffset": 14776320 + } + ], + "md5sum": "8cc7e97f7ca6086804efd499f1e5e71f" + } + ] +} \ No newline at end of file