diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..8144e623e9298c082a738681d9e77f1b0b973edc --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,7105 @@ +{ + "metadata": { + "ParamSize": 443, + "ParamBytes": 19677200384.0, + "BitsPerParam": 4.500110418416715 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 1048576000, + "records": [ + { + "name": "model.embed_tokens.q_weight", + "shape": [ + 256000, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 1048576000, + "byteOffset": 0 + } + ], + "md5sum": "90172f952317e27f8f3eadb8a833b298" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 131072000, + "records": [ + { + "name": "model.embed_tokens.q_scale", + "shape": [ + 256000, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 131072000, + "byteOffset": 0 + } + ], + "md5sum": "a15f399df006c9452a99a41845042bca" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.0.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "5f738e519bc173b908b7cd18431c29e8" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.0.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "d32a88c4601b719449740f9e4e0ec941" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.0.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "fa29ce568dff5f9093b97edb9a4e42ee" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.0.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "311ea3067bb11bd40f2fb3df606135b3" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.0.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.0.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.0.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.0.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "0bf412fdfd72cfe1bbe6c3e9babc5fe5" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.0.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "daaa92d0e8d1c22da6c49bca7992bcdd" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.1.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "52ed1c455e6231bb1d81efc8ea1ccd20" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.0.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.0.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.1.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "74bab5694c593c28b3305c6f25768503" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.1.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "32b73b10039081fcda2e8f03ead6841c" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.1.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "4af8ca8a3cfa630d59f3f21bbf769681" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.1.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.1.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "eeedbe99ab0d2825106928c56b3a36e3" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.1.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "2cec07be2d0ca19654e2d98fa7eca397" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.1.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "66a5b3602033eb9a585e85c9c9430520" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.2.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "c45f3c013b5fa9bc1bd2dca375ac79f3" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.1.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.1.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.1.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.2.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "6df0a68f5dc645329ec73c6f53dbec14" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.2.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "c48b9cbad61ecfde89049ccb16ceeaca" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.2.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "df885a3f12a59d21a57b271cd425450e" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.2.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.2.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "8a43afbc46b4f47643b80ec2f270aea9" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.2.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "a89395d538137c2626af121c3e309327" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.2.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c0225bde45c596864953614f93c7c4b1" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.3.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "08b2f4ac06f8ae1ec6f75acf158bb21f" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.2.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.2.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.2.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "78cd23ae9f746a2cca8764a440006b68" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.3.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a440a398a39fccfb6bc529d1c5238962" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.10.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "ea9073c5f186702d27103febbc03b2db" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.10.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "cd6000f8526794813876bee9d86854a2" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.3.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.3.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.10.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.10.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "2dcdc81c2dc2c48166f0f312265177b9" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.10.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "3e0eada4d26c11bf3ecc02c90371a904" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.10.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "f610ece4bebf2bda87662f1646b748c2" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.10.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.10.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "f923c1c3c2a9915f5ae3fc13f2f74d81" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.10.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "174ca52dbbff01c7ec2c9b1a251447cd" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.11.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "ae39caa4431c35187ab3dfc0e60c328c" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.11.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "08e177080ce65b8e4ada20b0ff6340be" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.10.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.10.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.11.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.11.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "491c25bdf1f29a3ba8cc469171e9b03a" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.11.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "ba51df0a15d17f72950c3f8508ff6d4f" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.11.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "ee158e48976b0a4f752ea621af2eefe8" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.11.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.11.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "2e678b14a9b535566e914ce283aed8c5" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.11.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "630bf903d2b3fc6792fcd06a0fa8a023" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.12.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "cf1807b062ead015ab356cb5d10162fe" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.12.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "fddb099a7a603f5587aaa0f1e4790bf0" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "model.layers.11.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.11.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.12.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 16777216 + } + ], + "md5sum": "96b454d533e8e46e1e54056186bedf15" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.9.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "a53f4c8cb46520a53c480c2e4fc4422a" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.9.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "a407472cabc23f09e6e7a18e71ee4f7b" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.9.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "00a87753b6dccedf6474bc210fd683f6" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "model.layers.12.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 0 + }, + { + "name": "model.layers.9.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 4194304 + }, + { + "name": "model.layers.9.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 4210688 + }, + { + "name": "model.layers.9.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 15745024 + } + ], + "md5sum": "ba44f9f5726fc5788335535666d85536" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.12.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "062bc39233f4b393902539914ddd7bc1" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.12.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "6319e6fe2d4125ef4ae4f4710900f957" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.9.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.12.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11534336 + }, + { + "name": "model.layers.12.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11550720 + } + ], + "md5sum": "2267d4b075b04461331af478345a3dea" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.12.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "bafe82192c047fd83aa610ff553e69f2" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.13.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "6a3183e9a24b5023975a66566bafd1a5" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.12.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.12.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.13.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "b0e1e37032c26cae6fb5a4e90104b984" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.13.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "a26e02288d9f92793fb54db5686dd073" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.13.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "b29a2dc235c83c0f6a2c5bb1790bed3d" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.13.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.13.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "1016bf9c830979eb5669cfc1f5f127c7" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.13.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "352b92942fa213287d31bc1862a93db6" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.13.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "02b433bce83998d618651e83b25798fa" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.14.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "763ee5cc10d9a37460f28283e3ba9cbf" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.13.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.13.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.13.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.14.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "7eb56b013d3fdd90f11add34c1b8d2b7" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.14.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "c0c8021a97ddd046df310f9bb7d8288c" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.14.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "10096f76d7daca95fc166815ad11cc0a" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.14.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.14.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "64ac37c99647869c9e1172e3eb66416d" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.14.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "470f0656a1c4844e6c129d0dbb964646" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.14.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "1ab87bec28f54e7d0d1e20575384b602" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.15.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "78648b6d6155ad08fb1fdf4283aa297e" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.14.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.14.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.14.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "15f23ef4f58a92efa7b004a76135e3cc" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.15.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "55a5919c45aad0a3e596a7ff042267a8" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.15.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "0f829762b8fde5110f5752e3fe7d0130" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.15.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "7aa51b0926aa39f81bcf6914c42a3b62" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.15.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.15.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.15.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.15.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "9f496910a366614141673d03c9dd2123" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.15.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "7c1166c80c716cf5641ca55fc580d36f" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.16.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "6ef361e0c26558e693dd0e685d1ee44d" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.15.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.15.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.16.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "37fafbfbd22d0e594fe30b20df7aee22" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.16.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "233989fcc58cb1859669fecc9ff30b76" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.16.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "a01d3a559901adfc0b0be9edd3a1a912" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.16.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.16.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "a01687654d114f164f52d4a3d4455881" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.16.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "8912ab6c9e7350b5d04b7b3ef616a059" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.16.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "4b3fe93a9b35a0d71991ee02d660129f" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.17.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "561b943391c70eddbd4609c269e46ec0" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.16.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.16.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.16.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.17.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "13a29c66235bf9e269b567f9709643e5" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.17.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "bedf8a29f0721e3ff9cd6177a2de886c" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.17.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "d3c1813501e3470778ed6134bf11b4a4" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.17.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.17.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "8a7e46eda9b7c0f50579fbf93c399b19" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.17.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "dd16d8ab1df70f9cc620b8006fccc1e7" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.17.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "8f86312eccd96a065854a168d311b245" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.18.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "bed53826334c452fad86027a2931b44f" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.17.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.17.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.17.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "8672850bd802f6fd85a32098250c352c" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.18.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "8c8db04554ed307105c602f2b271e8a7" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.18.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "3a91389aa1454d55dda240ef2c173f47" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.18.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "82ef8d516e30cce3f970671ca1bec8c6" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.18.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.18.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.18.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.18.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "bf191b63697d6b3083dbb46968716d69" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.18.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "85d7710d9b5942418510e8e8f73ef832" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.19.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "cc0ac1879d0e7a85df237b0670686edf" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.18.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.18.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.19.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "825a0f1ce346e132789486bc7cb7caca" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.19.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "c6b546bdf400890f12f4935854083b45" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.19.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "ad162ab66314c082216fc64b7a2c05cd" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.19.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.19.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "57efd0f4890720b8213461cb7f8a0170" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.19.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "b102d4399c024d170e85eeb1c2e1e7aa" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.19.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0a566b2b7b6e50182ee48c2a90486454" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.20.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "f52fad0ae62ba3ebb09d167fe36cabf2" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.19.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.19.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.19.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.20.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "9b7f4b8b317951ab17672f451e837413" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.20.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "30a3f1200ab76bb1c2f7ebfab14e2b1f" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.20.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "62b86d325dc23bec391aeb05ff401b86" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.20.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.20.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "5abf9fa19d23c4b07f056c00cf6aac18" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.20.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "a30c4cd40986f9bd34d0cfdd9cf744bf" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.20.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "5f07898d671ae8a24a05e70fc93ad3c9" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.21.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "4e914448c2897af9d820f219e27c8e94" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.20.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.20.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.20.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "d594712b5570cb29e643ac8d7da02417" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.21.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "98d4348e76939438cc920909874596e9" + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.21.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "8a650003d99f8fe513eae3744fdc3f47" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.21.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "8a0ea757d8c73c6e6d7acd2c0426f62b" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.21.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.21.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.21.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.21.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "d9a7f585878eacce5f201612bafa3ef6" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.21.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "79d35abeb80622d8cb280d0e444d56e7" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.22.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "6eb9dab516a6f8112295ab675ecb341c" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.21.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.21.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.22.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "a7b56a8dc7197c45c6d214c1c0329fa2" + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.22.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "f4f80aa9e2358907d5a36165d5f69130" + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.22.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "385c7cca884f9ead93cec68cac786429" + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.22.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.22.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "edd6b2bc08e6049c2ae0bcbe666e7a15" + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.22.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "65a934861ea4c69caaebbba00182032c" + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.22.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c7f0daf6eccdac9ba3af45a3cdc2feb7" + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.23.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "916de262e52897375e11be94e5760ba8" + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.22.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.22.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.22.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.23.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "c70e20ddf27e185d3907d9d3d92bb5b1" + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.23.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "5e4f51bc86e941200c808b780a29fc3e" + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.23.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "90ba3688af96b70188affbe87325817a" + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.23.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.23.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "2b80ae9a04dcffebbc2b3b1d92146505" + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.23.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "58f6a1143983d49eac34ffdd952fd613" + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.23.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "ddd429d783e9b8579932772851c907c3" + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.24.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "1942776c8c0dab7f9c3027e3943298b8" + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.23.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.23.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.23.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "323a887ec171ce72b95c96611d5464da" + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.24.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0b6e3738c8f8d8baa95c88f389d2dbb9" + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.24.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "4ea6a6e2ce094336d16dd9ea07939b7b" + }, + { + "dataPath": "params_shard_131.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.24.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "9edd49bb47d8b7e7ca926f8435999f4e" + }, + { + "dataPath": "params_shard_132.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.24.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.24.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.24.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.24.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "4980ac8e8266e5d381944db73c0305b5" + }, + { + "dataPath": "params_shard_133.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.24.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "4c7409a377e5ee4f659f9bfabd209e18" + }, + { + "dataPath": "params_shard_134.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.25.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "1dfb4cb0c3ce248d65c75047e4c2d0b0" + }, + { + "dataPath": "params_shard_135.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.24.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.24.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.25.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "f4feac9dcc6e53d980bca05ccf661a61" + }, + { + "dataPath": "params_shard_136.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.25.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "d29c60d5faaa8bef98a44bc3ce451bc1" + }, + { + "dataPath": "params_shard_137.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.25.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "21a1874290c3f3860773326c631d3bb4" + }, + { + "dataPath": "params_shard_138.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.25.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.25.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "d0344fb95ceca1890aa71a945a0b3194" + }, + { + "dataPath": "params_shard_139.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.25.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "f60b3f6a95f75abd43951d48ce007f88" + }, + { + "dataPath": "params_shard_140.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.25.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "14030af2882cd70601690811867a8042" + }, + { + "dataPath": "params_shard_141.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.26.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "250384cee7b34d8a1b59407e2d552a69" + }, + { + "dataPath": "params_shard_142.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.25.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.25.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.25.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.26.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "8c815231b227f92b4d9a5113e7cb981d" + }, + { + "dataPath": "params_shard_143.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.26.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "6d570a3123feb214fa7489a6ecb179d5" + }, + { + "dataPath": "params_shard_144.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.26.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "ced6f37b0b5fd730016a7227d3100270" + }, + { + "dataPath": "params_shard_145.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.26.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.26.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "b6ca95c5ac16a41d05697ba6dfc56fb5" + }, + { + "dataPath": "params_shard_146.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.26.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "d1ea5c60acd533f8e46b591087e8eef5" + }, + { + "dataPath": "params_shard_147.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.26.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "ab5e725e583a76b03849a1dda254e613" + }, + { + "dataPath": "params_shard_148.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.27.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "a494a30b8ddfcf1a9a6278f64b573d1a" + }, + { + "dataPath": "params_shard_149.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.26.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.26.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.26.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "4bce08f6e2ed28357955a324ce2feec9" + }, + { + "dataPath": "params_shard_150.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.27.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "e05f01861de1248d44f182229a1215a6" + }, + { + "dataPath": "params_shard_151.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.27.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "8705c0f10d39579b358d32370a823b9b" + }, + { + "dataPath": "params_shard_152.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.27.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "51b5ff4d83d971c3361238c94607069f" + }, + { + "dataPath": "params_shard_153.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.27.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.27.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.27.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.27.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "e93fc5a370fbee2beafc33173c2e2206" + }, + { + "dataPath": "params_shard_154.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.27.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "08a4e1432bf406cf005b451a5674cdc2" + }, + { + "dataPath": "params_shard_155.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.28.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "01649d01d47e2e04b8a4fa8bae8ef674" + }, + { + "dataPath": "params_shard_156.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.27.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.27.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.28.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "f5f64bf567551b9e2e3912be3b4c81bc" + }, + { + "dataPath": "params_shard_157.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.28.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "8bd169b00ae7def01c1b322c716cb22f" + }, + { + "dataPath": "params_shard_158.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.28.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "c0ec7e56d0728db56e158817a45f53b1" + }, + { + "dataPath": "params_shard_159.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.28.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.28.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "5623df5e01446c861eed9368a96cfe4b" + }, + { + "dataPath": "params_shard_160.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.28.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "6557beb113740a47bb0e6f87b8c8b3a3" + }, + { + "dataPath": "params_shard_161.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.28.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "b447a9f2bdf813740ce910ef65cb51ab" + }, + { + "dataPath": "params_shard_162.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.29.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "3e4ad4b17cb80cc056c746663516dfc2" + }, + { + "dataPath": "params_shard_163.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.28.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.28.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.28.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.29.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "4db448f55aef5079bb3b972dc1eda472" + }, + { + "dataPath": "params_shard_164.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.29.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "904a623a956706aa0fa5af76bd29ced6" + }, + { + "dataPath": "params_shard_165.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.29.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "8544ec70973bd870422cca06d7e4322b" + }, + { + "dataPath": "params_shard_166.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.29.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.29.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "3612c1415cfb5711e4a5cf4bb05b7215" + }, + { + "dataPath": "params_shard_167.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.29.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "e6dfd82bcf8854b5763e6df6e722b1ab" + }, + { + "dataPath": "params_shard_168.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.29.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "19959f8c41c7bc1bd734162f7962b800" + }, + { + "dataPath": "params_shard_169.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.30.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "8ee30a2e8c0ea1dd759ab9a1f6647579" + }, + { + "dataPath": "params_shard_170.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.29.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.29.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.29.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "d55b8cca2b07feaebeeb39efeb882898" + }, + { + "dataPath": "params_shard_171.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.30.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "decf42439c00a38540b0b78497235394" + }, + { + "dataPath": "params_shard_172.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.3.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "256182df76b0dd991065bbcc5eddba20" + }, + { + "dataPath": "params_shard_173.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.3.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "cc7b84655d1a84f7cccecd31519b5548" + }, + { + "dataPath": "params_shard_174.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.30.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.30.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.3.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.3.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "175a32c435087d57f73c514433c433a8" + }, + { + "dataPath": "params_shard_175.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.3.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "7969b6bd1627307c2c999df526c43497" + }, + { + "dataPath": "params_shard_176.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.4.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "270054b5b37e1b11f92b50796b1e8a2f" + }, + { + "dataPath": "params_shard_177.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.3.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.3.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.4.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "20e9bafc6f40df87415ed5d1da4c9ca8" + }, + { + "dataPath": "params_shard_178.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.4.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "65b3b9a0b90e420ffdacfe28d3a2e512" + }, + { + "dataPath": "params_shard_179.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.4.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "bd276f02a30e0b0ba3cef20bc120aba8" + }, + { + "dataPath": "params_shard_180.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.4.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.4.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "8e16dc11466528b9070f0aefef610ddb" + }, + { + "dataPath": "params_shard_181.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.4.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "5ff7d50f1d9fdfaaa921ece84e4b60d2" + }, + { + "dataPath": "params_shard_182.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.4.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "da602082ad3cb81a6fb6d448deea8a2a" + }, + { + "dataPath": "params_shard_183.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.5.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "d7f4404958ebc4030269b7c722df1588" + }, + { + "dataPath": "params_shard_184.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.4.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.4.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.4.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.5.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "dec5ccccc71d25e094ed9b4690c2ae94" + }, + { + "dataPath": "params_shard_185.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.5.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "a561eb4820f06e6867820e7f160a8bea" + }, + { + "dataPath": "params_shard_186.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.5.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "1f46a83a50b5d528f676ded352221a06" + }, + { + "dataPath": "params_shard_187.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.5.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.5.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "e9b81e08ce91a5fe4454410903ccd0a4" + }, + { + "dataPath": "params_shard_188.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.5.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "a90216d5c51ae158f14f0754e3389d8f" + }, + { + "dataPath": "params_shard_189.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.5.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "aee0323275395b86ab3239747354d600" + }, + { + "dataPath": "params_shard_190.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.6.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "f8a8e0fcacba6f035b18427a82acf470" + }, + { + "dataPath": "params_shard_191.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.5.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.5.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.5.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "3aa3ca8b8247561f4c9cfc797fe93ff7" + }, + { + "dataPath": "params_shard_192.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.6.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "38bdcc512a19fc28f1416f09debdf7e2" + }, + { + "dataPath": "params_shard_193.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.30.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "6ab0f421dc2298eb0b2d2abb43139f2e" + }, + { + "dataPath": "params_shard_194.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.30.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "b31ee355cb774201550ebc1ff303c79e" + }, + { + "dataPath": "params_shard_195.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.6.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.6.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.30.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.30.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "a9c299554fb451b9b1277cca0ca13e51" + }, + { + "dataPath": "params_shard_196.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.30.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "67da15ff0c92dce1cdb4d95eb503fac7" + }, + { + "dataPath": "params_shard_197.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.31.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "266bf35871c1889697b2d314bcd53597" + }, + { + "dataPath": "params_shard_198.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.30.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.30.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.31.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "4889baf39475cfb32a93512c397f99f0" + }, + { + "dataPath": "params_shard_199.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.31.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "13d6d7ea523f6b47520579f6c85b0575" + }, + { + "dataPath": "params_shard_200.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.31.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "2e83a86ca989e63cae0d463f05888a8c" + }, + { + "dataPath": "params_shard_201.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.31.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.31.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "b293c034bc8aa088b7fce32c4578882f" + }, + { + "dataPath": "params_shard_202.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.31.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "945e19d74838c0d4c700e83029e71e71" + }, + { + "dataPath": "params_shard_203.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.31.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "56c46b19341bac2fc72b995657e757fd" + }, + { + "dataPath": "params_shard_204.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.32.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "7dd0d96ec1815a55ed2c587577a59774" + }, + { + "dataPath": "params_shard_205.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.31.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.31.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.31.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.32.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "9d84edab70c0ca473c0d4e08c0e24048" + }, + { + "dataPath": "params_shard_206.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.32.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "f1ef298a7dae5fb550148b98687d3585" + }, + { + "dataPath": "params_shard_207.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.32.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "c4e3befcf15fcdbfa2f45a803bc6dae3" + }, + { + "dataPath": "params_shard_208.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.32.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.32.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "08bc2517b73a1ec3aff7722d1f8e64cc" + }, + { + "dataPath": "params_shard_209.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.32.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "46eb968739cef3f8349e6eebe45717cd" + }, + { + "dataPath": "params_shard_210.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.32.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "00252f4ce1d302b5d184a804077d8ace" + }, + { + "dataPath": "params_shard_211.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.33.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "be2e70ae1191e2e5b1d987b51b756094" + }, + { + "dataPath": "params_shard_212.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.32.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.32.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.32.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "571476198667e3c2ed12e6a14dbea23f" + }, + { + "dataPath": "params_shard_213.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.33.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "bb7cbe407ab525852f6e49caf658ebb3" + }, + { + "dataPath": "params_shard_214.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.33.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "fbc57d00faa34815fd241d3c708b61ad" + }, + { + "dataPath": "params_shard_215.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.33.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "af68e5967ae6fa81d9a4e6b42bdc68c2" + }, + { + "dataPath": "params_shard_216.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.33.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.33.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.33.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.33.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "73bab6601fad81d91a11848a9032b208" + }, + { + "dataPath": "params_shard_217.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.33.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "c00efba3d4f9afb991d04bdbdc3d73d3" + }, + { + "dataPath": "params_shard_218.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.34.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "60ba21254300f2ec7123ff7c47e9a870" + }, + { + "dataPath": "params_shard_219.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.33.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.33.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.34.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "cbf8875735c9b1cb6660c9812b23f59b" + }, + { + "dataPath": "params_shard_220.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.34.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "a6923835ba69dc280e8511e2d683eea2" + }, + { + "dataPath": "params_shard_221.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.34.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "b9407c6e4501f3cdeed0be81c1ea6064" + }, + { + "dataPath": "params_shard_222.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.34.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.34.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "ef2ccb684058fe655abd337a6bfab9d0" + }, + { + "dataPath": "params_shard_223.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.34.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "a8d36e55399e732e826f11ae4ec5e851" + }, + { + "dataPath": "params_shard_224.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.34.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "563be7914aa22c8be3c246a43c0029ef" + }, + { + "dataPath": "params_shard_225.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.35.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "1f82d59e84cbca683b76c54b6fa0a98c" + }, + { + "dataPath": "params_shard_226.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.34.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.34.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.34.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.35.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "3df8e982ffcefdfaeb9cfb038a799134" + }, + { + "dataPath": "params_shard_227.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.35.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "1ab22de5551e6af2df2315cf6d0d1167" + }, + { + "dataPath": "params_shard_228.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.35.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "a8c232a082f55b472dbcb12b7e493171" + }, + { + "dataPath": "params_shard_229.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.35.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.35.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "4b8e46cc732669bdc6061632ea9ef405" + }, + { + "dataPath": "params_shard_230.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.35.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "63da5e5c89b84bc8f58465f62b6f32a1" + }, + { + "dataPath": "params_shard_231.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.35.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "5026084039b948a7e22d24908a4f6dbf" + }, + { + "dataPath": "params_shard_232.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.36.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "c9214df1271b9cd306085cd3494b973e" + }, + { + "dataPath": "params_shard_233.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.35.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.35.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.35.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "35bbaabe89bac88dadb9652af8da4487" + }, + { + "dataPath": "params_shard_234.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.36.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "9f6414641142cd0cac7441c4e731b0c9" + }, + { + "dataPath": "params_shard_235.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.36.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "f967fabdee8ec14f4cebd583498b8c40" + }, + { + "dataPath": "params_shard_236.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.36.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "aa00972926007b4df90826e8d9f3ef1e" + }, + { + "dataPath": "params_shard_237.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.36.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.36.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.36.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.36.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "17031ac9726479211013d22e99a4b7bf" + }, + { + "dataPath": "params_shard_238.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.36.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "09f696fc0d957db534a1d0c6d24684cc" + }, + { + "dataPath": "params_shard_239.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.37.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "66afc062efcf65b868f713cf2627cadb" + }, + { + "dataPath": "params_shard_240.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.36.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.36.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.layers.37.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + } + ], + "md5sum": "857f114b60b3b8f20441154d601f884a" + }, + { + "dataPath": "params_shard_241.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.37.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "3fa66bbbf904e58e596908ffa6589873" + }, + { + "dataPath": "params_shard_242.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.37.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "7f6b04af9d306428aab8676d0e740ac7" + }, + { + "dataPath": "params_shard_243.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.37.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.37.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "324c66d48e6d100ba90f19765c4cdd3d" + }, + { + "dataPath": "params_shard_244.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.37.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "d9fa4efd204707827e1fd29ac68b39b7" + }, + { + "dataPath": "params_shard_245.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.37.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "f162529c939d1850a8df4d2a2d23f8f0" + }, + { + "dataPath": "params_shard_246.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.38.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "b84bd3d28733275b88fb2130ba0853ad" + }, + { + "dataPath": "params_shard_247.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.37.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.37.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.37.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + }, + { + "name": "model.layers.38.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 28311552 + } + ], + "md5sum": "68f75c56c6fd6d34e64e7b1e0f72212e" + }, + { + "dataPath": "params_shard_248.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.38.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "124ad70e3288ebca68279329f73861a0" + }, + { + "dataPath": "params_shard_249.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.38.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "9c342a4d8fdf2ab4f00efb2d84a5b727" + }, + { + "dataPath": "params_shard_250.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.38.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.38.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "906596a1f2c23f7a8792d1a515bd42b4" + }, + { + "dataPath": "params_shard_251.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.38.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "51f375558eba2a1947cc30047748c5df" + }, + { + "dataPath": "params_shard_252.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.38.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "1005631fa756c00cc8f3a029bff7775b" + }, + { + "dataPath": "params_shard_253.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.39.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "c768dd345e9f0542f238afb6a626fc0b" + }, + { + "dataPath": "params_shard_254.bin", + "format": "raw-shard", + "nbytes": 28311552, + "records": [ + { + "name": "model.layers.38.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.38.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 11534336 + }, + { + "name": "model.layers.38.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 24117248 + } + ], + "md5sum": "089757ed552e9b43f0b839cd1b08b022" + }, + { + "dataPath": "params_shard_255.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.39.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "4ffdf8517fe9c8f58458f344a1438e29" + }, + { + "dataPath": "params_shard_256.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.39.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "e7267130507f36cb7af083469bacaea8" + }, + { + "dataPath": "params_shard_257.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.39.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "8fda46b6e82fe362b06f2edde57ae524" + }, + { + "dataPath": "params_shard_258.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.39.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.39.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.39.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.39.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "f9c30ce50cfde57ce994555b8fed164a" + }, + { + "dataPath": "params_shard_259.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.39.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "008e2a8740e6145639b9ef0c702df4ff" + }, + { + "dataPath": "params_shard_260.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.6.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "75081ae45c2d2b15d25ad519248a3163" + }, + { + "dataPath": "params_shard_261.bin", + "format": "raw-shard", + "nbytes": 23101440, + "records": [ + { + "name": "model.layers.39.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.39.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + }, + { + "name": "model.norm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23068672 + }, + { + "name": "model.layers.6.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23085056 + } + ], + "md5sum": "711cdccad9028f6975f529dac477b404" + }, + { + "dataPath": "params_shard_262.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.6.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "a561a7f21d679d224a2e8de6f93f62e8" + }, + { + "dataPath": "params_shard_263.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.6.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "a268b53595edc8915bd355593bdd1e65" + }, + { + "dataPath": "params_shard_264.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.6.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.6.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "287969efcf204344fcd9a15526eafeb3" + }, + { + "dataPath": "params_shard_265.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.7.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "252163a4d71154a4f05fed13aee90ae8" + }, + { + "dataPath": "params_shard_266.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.7.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "4426a827bdb98e0ec16582f638294ad6" + }, + { + "dataPath": "params_shard_267.bin", + "format": "raw-shard", + "nbytes": 23085056, + "records": [ + { + "name": "model.layers.6.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.7.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11534336 + }, + { + "name": "model.layers.7.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11550720 + } + ], + "md5sum": "84045f863aec7fd1f43750cb26732bee" + }, + { + "dataPath": "params_shard_268.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.7.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "5880ade62e34d7cce4793e1f345121be" + }, + { + "dataPath": "params_shard_269.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.7.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "2fc8759b704bcf9eb7d038684d9e7013" + }, + { + "dataPath": "params_shard_270.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.7.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.7.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "023c7d162f6c54dd163eeaec98f7abed" + }, + { + "dataPath": "params_shard_271.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.7.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "1ec521b2b9feb69800be41703b1087b2" + }, + { + "dataPath": "params_shard_272.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.8.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2816 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "f60a461828d2977bbe620437c79d50d3" + }, + { + "dataPath": "params_shard_273.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.8.mlp.gate_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "dbea397fbfeb694cc148d1096c97294f" + }, + { + "dataPath": "params_shard_274.bin", + "format": "raw-shard", + "nbytes": 28327936, + "records": [ + { + "name": "model.layers.7.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.7.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.8.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16777216 + }, + { + "name": "model.layers.8.mlp.down_proj.q_scale", + "shape": [ + 8192, + 704 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 16793600 + } + ], + "md5sum": "0d5349c354925f5b442513eb16724417" + }, + { + "dataPath": "params_shard_275.bin", + "format": "raw-shard", + "nbytes": 92274688, + "records": [ + { + "name": "model.layers.8.mlp.up_proj.q_weight", + "shape": [ + 22528, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 92274688, + "byteOffset": 0 + } + ], + "md5sum": "bb92de0a6cd0e564b14c781e4e8491e4" + }, + { + "dataPath": "params_shard_276.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.8.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "473062a2cb2f45e845278b58c8b1ac0e" + }, + { + "dataPath": "params_shard_277.bin", + "format": "raw-shard", + "nbytes": 23068672, + "records": [ + { + "name": "model.layers.8.mlp.gate_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 0 + }, + { + "name": "model.layers.8.mlp.up_proj.q_scale", + "shape": [ + 22528, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11534336, + "byteOffset": 11534336 + } + ], + "md5sum": "ca862c3759a36ba30e529635383d4c13" + }, + { + "dataPath": "params_shard_278.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.8.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "89b53ca5f34ff792d316d7036bd5f486" + }, + { + "dataPath": "params_shard_279.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.9.self_attn.qkv_proj.q_weight", + "shape": [ + 24576, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "bfb0bf807caae04ed49b831e1d8979cf" + }, + { + "dataPath": "params_shard_280.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.9.self_attn.out_proj.q_weight", + "shape": [ + 8192, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "20ff683eb65ece3b8b00204e0fc9a7a4" + }, + { + "dataPath": "params_shard_281.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "model.layers.8.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.8.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 12582912 + }, + { + "name": "model.layers.9.self_attn.qkv_proj.q_scale", + "shape": [ + 24576, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 16777216 + } + ], + "md5sum": "1498527f4562fd9d2dd9691346bb4597" + }, + { + "dataPath": "params_shard_282.bin", + "format": "raw-shard", + "nbytes": 4194304, + "records": [ + { + "name": "model.layers.9.self_attn.out_proj.q_scale", + "shape": [ + 8192, + 256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4194304, + "byteOffset": 0 + } + ], + "md5sum": "f8149cf91f163e76b17129dbbd6f3aa4" + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..fe75719a5ece3211be5ed57ce97fc94e50fb88b1 --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84802677e4f8cf466a18acf843c6f0239517015a2708ab7d636c5b0447666b77 +size 1048576000 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..b51bc8955bf2456659a078f0f98579b1341bb304 --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c4f4811b2f1342617f9d920b75dcb506dfd13b97eaf50a4a20a0a6d038d3a0c +size 131072000 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c63dccd15ba34e5f69becaccb5500016f2dc341 --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b082f7e5d23ca19f4916f94b8ad5a09d363c6b2a53d5534d8f9b7c30dc8c9113 +size 92274688 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..710e63d6ac42d6a6360eb900375df1ad84e87a7c --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bed7616e08f47de8293067d690bf740cec1f76c4cedca53054bb5fa73ed6c1cc +size 28327936 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..c9182611a514c54149556a8509cbba4dcd92f711 --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00350a1f460ea1d91964d809d6acce1375819f3b10aada6db9c52bcbf5943302 +size 92274688 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..f958e22f8bf1735da4072083263d63ce894d4bff --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56c19b93a7134194db12edc8e4a9f81aac07458759f5961894f8356ba71ada5b +size 92274688 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..8d23849fab19e72f1e6e99b10db1a8f0d8c4c60f --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f2aefe25b64b5f36c1427d957616619d09903ce4d2df87f2ae582c152a05fd0 +size 23068672 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7a59af56a5102078424e815cac68349523ad7d4 --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:635767b73999733f0c215977adb3edac470bc1b7c7f2462101e4e211739ef857 +size 100663296 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..e811f2a1f56dd80a3044826e57a0dea9568d7bf4 --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fabe87e587ee143288896a9ee75dc029f3f0208f2b4d1ac07791b6ac60d7e74e +size 33554432 diff --git a/params_shard_106.bin b/params_shard_106.bin new file mode 100644 index 0000000000000000000000000000000000000000..70e1094665e4591b6dd66aa2d9f4e8dbfcebb455 --- /dev/null +++ b/params_shard_106.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:646066f3e07655a787c3932d5c86b80217cc4806529a3e232378589bd5bb195d +size 100663296 diff --git a/params_shard_107.bin b/params_shard_107.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7ddc9f9395827c7c25e541a245d1aa12ea92ace --- /dev/null +++ b/params_shard_107.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e22337f443c11edc80c3cde94f5fc1cc8640478686a07e53caa260791ebd43 +size 28311552 diff --git a/params_shard_108.bin b/params_shard_108.bin new file mode 100644 index 0000000000000000000000000000000000000000..2113987e46d51e65150736cf81f835c55cebf320 --- /dev/null +++ b/params_shard_108.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ee49c9c27f30476690647603b4e2850029f91291811c78ad5a7db0c38b3ab10 +size 33554432 diff --git a/params_shard_109.bin b/params_shard_109.bin new file mode 100644 index 0000000000000000000000000000000000000000..6b622efaef3c28ddfefaf3636121bfd201b67a45 --- /dev/null +++ b/params_shard_109.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:051859d6c1af5a78665b3fbdd3577eb909eb77b33cd0c9b0f7593096e79d593d +size 92274688 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..990679564c47c7068816cd7adec7b924fb50cac0 --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c648e36c5649aac062c2f38af6bb80680370e179ae42aa973bee6f4ef6f0ea55 +size 92274688 diff --git a/params_shard_110.bin b/params_shard_110.bin new file mode 100644 index 0000000000000000000000000000000000000000..9881d6759ce72dc5ec98dc1ecadd7f2d3f775051 --- /dev/null +++ b/params_shard_110.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e2f1012b90eeebfe2897500cd0498e70860609f0d8fa6ae0f09d4a78ba74b5f +size 92274688 diff --git a/params_shard_111.bin b/params_shard_111.bin new file mode 100644 index 0000000000000000000000000000000000000000..45433f26682eaa4da0cf5f8d7123226916210949 --- /dev/null +++ b/params_shard_111.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edb90978f72ddc6643989bbd85b0a8f7d1b06367b38a3cd524da265448b41bba +size 28327936 diff --git a/params_shard_112.bin b/params_shard_112.bin new file mode 100644 index 0000000000000000000000000000000000000000..20b3f51137a6e2be6608660c8505664aa134bca3 --- /dev/null +++ b/params_shard_112.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8e74d645a79fc5c5b329c0899997c4b5bcfa2be82a67749d578eecf66c79f3c +size 92274688 diff --git a/params_shard_113.bin b/params_shard_113.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ab9599bc19cc13d1ffdb29e37a67bf4f7811f9c --- /dev/null +++ b/params_shard_113.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23b711122e94fbc3f9f649c3a0d48bb95d0896e244ae1a9591913f865301ae35 +size 92274688 diff --git a/params_shard_114.bin b/params_shard_114.bin new file mode 100644 index 0000000000000000000000000000000000000000..98132a46458d8dda26549b2b14f57e65398a5419 --- /dev/null +++ b/params_shard_114.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c291147f1dd68b6db1e5316952242eaff8e350add2d5409bb2c7d5bd6290c15 +size 23085056 diff --git a/params_shard_115.bin b/params_shard_115.bin new file mode 100644 index 0000000000000000000000000000000000000000..1f56fb27d8da125abc84103932a2ca973e23898f --- /dev/null +++ b/params_shard_115.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:571fcc2e3c8cdcb009f26ad7716f53442e9307240faceea9fdee02cfb0cd9e3b +size 92274688 diff --git a/params_shard_116.bin b/params_shard_116.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd18df82e3dec1a1b1bab7541bd98878ebfc46b3 --- /dev/null +++ b/params_shard_116.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e70723267f2050fce7c9f61a50c60d201562f6ed38bf76ca50df0142bd396f32 +size 92274688 diff --git a/params_shard_117.bin b/params_shard_117.bin new file mode 100644 index 0000000000000000000000000000000000000000..005c2e84afd3c568a8ca75ed5fe31c4f4dd5d67e --- /dev/null +++ b/params_shard_117.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38ba43e8e84c1d30ef1102be7d7b3e9ce4874bc0a46336f60de8f3dc7e84a223 +size 23068672 diff --git a/params_shard_118.bin b/params_shard_118.bin new file mode 100644 index 0000000000000000000000000000000000000000..c86dbf57d350f62113730a465a37c1921c6a744d --- /dev/null +++ b/params_shard_118.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bec06014bec947f2ffd6808b87a1fa6610a9cddfd0c1ac9eb4896ddb6f908654 +size 100663296 diff --git a/params_shard_119.bin b/params_shard_119.bin new file mode 100644 index 0000000000000000000000000000000000000000..4f33f79675774bf5e99cf9b5419f28d2e22696d0 --- /dev/null +++ b/params_shard_119.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c434735434b5f4b222d3c8adc576d640ec685324da9af08eedec0798bc097394 +size 33554432 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..05efa4a7658bc4733abec0a88d0a4867c84e09df --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca0a185bdf0ea0dd414ec5fd55efe8a1d2aed426cce411f2bb7253cd034f737 +size 23068672 diff --git a/params_shard_120.bin b/params_shard_120.bin new file mode 100644 index 0000000000000000000000000000000000000000..6810b9cb19e646c9d5b386b7df1b12158a23c971 --- /dev/null +++ b/params_shard_120.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b43a7e827cc5e13e28fc869c578b8d1e1ce02d5ac6c36f706961b507ce55bfc7 +size 92274688 diff --git a/params_shard_121.bin b/params_shard_121.bin new file mode 100644 index 0000000000000000000000000000000000000000..5e34a684b596018539d7d27d5945649cc5f7bc8b --- /dev/null +++ b/params_shard_121.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56fa1a7dfeff62038b62f091576fbac9003bf0301e832bc3fe05242b9090e23f +size 28327936 diff --git a/params_shard_122.bin b/params_shard_122.bin new file mode 100644 index 0000000000000000000000000000000000000000..9675565a2e2c7a054d3197adaad18fb79e89a9f3 --- /dev/null +++ b/params_shard_122.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:832cd30365986ff5a8b8de733c02683499a246a9c55167b6a94d4d8503fb9e50 +size 92274688 diff --git a/params_shard_123.bin b/params_shard_123.bin new file mode 100644 index 0000000000000000000000000000000000000000..185e357acf638e849a32ea38087a393624814b2c --- /dev/null +++ b/params_shard_123.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e25da330e12e9287e2f1ca424dace10aa01bac256d226c68f37a76d38b6d970 +size 92274688 diff --git a/params_shard_124.bin b/params_shard_124.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba69d06379dc1392d10d8d5b572cb09ffa518abd --- /dev/null +++ b/params_shard_124.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab2e5793855d7f9c9f94d581058ba1b0589bb230ee17c20a61f6f7ae2259c5da +size 23068672 diff --git a/params_shard_125.bin b/params_shard_125.bin new file mode 100644 index 0000000000000000000000000000000000000000..1d1c81da22a5d1648dfbd5f6824fada2843a392d --- /dev/null +++ b/params_shard_125.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08dda5583331e88a6cf103c5d39e5dfddb3dbf98f8f429a1af0c45a169271efa +size 100663296 diff --git a/params_shard_126.bin b/params_shard_126.bin new file mode 100644 index 0000000000000000000000000000000000000000..b4eb1cede261d0195c26d2bbff0ac55d7e2c4ab8 --- /dev/null +++ b/params_shard_126.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daff8b133875685b55b4a36d4a7addfe7e79b3d5566df26da4f6546333933f7b +size 33554432 diff --git a/params_shard_127.bin b/params_shard_127.bin new file mode 100644 index 0000000000000000000000000000000000000000..e2509e49c76a79013842a7a5d074268e0206563a --- /dev/null +++ b/params_shard_127.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9702b1865017e468d8c1f40843d47c2b12425eb5c3c04018a9b202dc2a3a550 +size 100663296 diff --git a/params_shard_128.bin b/params_shard_128.bin new file mode 100644 index 0000000000000000000000000000000000000000..c078d8e0c0d76f41f482b21d6b41540cfab139a0 --- /dev/null +++ b/params_shard_128.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1b1fd75a2afb50d994a5e4140e3180a3abd8d65cc669da1f75828fe7952a0c +size 28311552 diff --git a/params_shard_129.bin b/params_shard_129.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8ffb5bc1a8b0c23e083b2aab2e8fde890e731b8 --- /dev/null +++ b/params_shard_129.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:defa33a8816b99b868388db66792520a6954ffc27842997f91971493c450a0e6 +size 33554432 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..fe08f803ed7677f0e39237118aed2fec109019b4 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1a8c40cc19d10c22e2306f5deb21c18a59dffeaa72983a0588d86fd2ece64d7 +size 100663296 diff --git a/params_shard_130.bin b/params_shard_130.bin new file mode 100644 index 0000000000000000000000000000000000000000..56e38d1262deebecbf5d035c1aefd208d6348a76 --- /dev/null +++ b/params_shard_130.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0079328b581f51a8348006a14eca2fd8e34ca4a3b8b1c19a6a194de79c1303f4 +size 92274688 diff --git a/params_shard_131.bin b/params_shard_131.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a9b196cc0529dd112e0e1b85307cb10e0c51323 --- /dev/null +++ b/params_shard_131.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69695f7a54d2d452e873aeae6ce45e2b5065534b1ec392ce8ad35d39e282b80e +size 92274688 diff --git a/params_shard_132.bin b/params_shard_132.bin new file mode 100644 index 0000000000000000000000000000000000000000..8b25ec9c26dce605063e4978b9f42d635679f973 --- /dev/null +++ b/params_shard_132.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c63b0b2377bc9cc3ec06dc352519a4cb3a8ddd00143be1d54f78500c82f3c163 +size 28327936 diff --git a/params_shard_133.bin b/params_shard_133.bin new file mode 100644 index 0000000000000000000000000000000000000000..c0104711bdc0173cd7ddd49301d39c1b2efc2ec0 --- /dev/null +++ b/params_shard_133.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9970a6a70b44d67ba46805dce787431bc85ae04386c64582b6aa804e19365c +size 92274688 diff --git a/params_shard_134.bin b/params_shard_134.bin new file mode 100644 index 0000000000000000000000000000000000000000..8422a9e232e1761d1421947179c8ecc415699198 --- /dev/null +++ b/params_shard_134.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca5e02ace9450ee0c53055cd22afaa1e27d46a55685b0e11a0880bbf7412b074 +size 92274688 diff --git a/params_shard_135.bin b/params_shard_135.bin new file mode 100644 index 0000000000000000000000000000000000000000..74a69c85e6bf3c90f9a1b96fe3a648bc234c442d --- /dev/null +++ b/params_shard_135.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e3e85bdbba4d2d22b9aa9442f83a4704d7af40d01b0ed4b280826e29c6092c +size 23085056 diff --git a/params_shard_136.bin b/params_shard_136.bin new file mode 100644 index 0000000000000000000000000000000000000000..bb4c5fd60454d0445cedecc6442ea9bb47f64f30 --- /dev/null +++ b/params_shard_136.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:027da1d1b23817d68b6aa5f228777f81b4986454e1ecca9b20b9f0ecd6b692c9 +size 92274688 diff --git a/params_shard_137.bin b/params_shard_137.bin new file mode 100644 index 0000000000000000000000000000000000000000..903db106cbce32a6a513f411f8dc1f30f47d4ba8 --- /dev/null +++ b/params_shard_137.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8647d3d4a1b76e095a4c7dbd75db81faaa758afc5507e1f75fa851cf9ee090ce +size 92274688 diff --git a/params_shard_138.bin b/params_shard_138.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab533982e000af73769c83f4f7cb405c413a2a31 --- /dev/null +++ b/params_shard_138.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21de27871f1e8c1bb4ef6027c3474130d1cf7a44edf647343d9274a9ed3bda2c +size 23068672 diff --git a/params_shard_139.bin b/params_shard_139.bin new file mode 100644 index 0000000000000000000000000000000000000000..8ed9a9cb3d22cc7f423ebbd4bde55e19b46e78fa --- /dev/null +++ b/params_shard_139.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33f53fdb55ddd1f8398505a3f8bb1de6c868e30a34d097db7c1233aa70ded7a3 +size 100663296 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..3baa47e38ef0cdf9f07c6c65100a5cd486f9b28e --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d2da80bfb4e4139f51147249de900d08b8e5a60d1074a263570c883354554d6 +size 33554432 diff --git a/params_shard_140.bin b/params_shard_140.bin new file mode 100644 index 0000000000000000000000000000000000000000..6087314f9f5f330326a016adedc8eeeae7c6a999 --- /dev/null +++ b/params_shard_140.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0c51bdfc309d3bd7a13e7ed443c9a05c70e1a58b7ff1068fdb550517af72d4d +size 33554432 diff --git a/params_shard_141.bin b/params_shard_141.bin new file mode 100644 index 0000000000000000000000000000000000000000..f39983716339274d086029069ebff46255dce4aa --- /dev/null +++ b/params_shard_141.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9900ff4242ea6ec9147413f642ea1fdbd85eee94b45ab98136532ed95b8afe9 +size 92274688 diff --git a/params_shard_142.bin b/params_shard_142.bin new file mode 100644 index 0000000000000000000000000000000000000000..feb90b430749ca8669ec0141263a4de6d529a7c4 --- /dev/null +++ b/params_shard_142.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1692d717bcad8edf8f18eb1a8f8b7f88e5001d750a70e7baaef584c7c5f5c0 +size 28327936 diff --git a/params_shard_143.bin b/params_shard_143.bin new file mode 100644 index 0000000000000000000000000000000000000000..5a670f9da58a63095ddfa0291219dbf7b5addf79 --- /dev/null +++ b/params_shard_143.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb652bfbbc361b105f6739e51f3104794ceaba7c7c8e662ed5e4d20528e01505 +size 92274688 diff --git a/params_shard_144.bin b/params_shard_144.bin new file mode 100644 index 0000000000000000000000000000000000000000..f11af8a2e912fe6aa2cc00e12e380afd6ec42ba6 --- /dev/null +++ b/params_shard_144.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d16a694dea64cdba776251e89054c8f41ab437b745c188257be20525f69e6389 +size 92274688 diff --git a/params_shard_145.bin b/params_shard_145.bin new file mode 100644 index 0000000000000000000000000000000000000000..16ed01c02a1ed7b5afe93451409c140060b09533 --- /dev/null +++ b/params_shard_145.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d6eb5680fd6ab30e6ec797c1c2c5c1d893501368d5d3f0bc73eabb409e953c +size 23068672 diff --git a/params_shard_146.bin b/params_shard_146.bin new file mode 100644 index 0000000000000000000000000000000000000000..3df36b073c98e1e8a41bdd286b722e4f181f8242 --- /dev/null +++ b/params_shard_146.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6867f23ec68ad90985a356a36b2af82dbebceebb2f3a5a1bea97c059d1bd4ad6 +size 100663296 diff --git a/params_shard_147.bin b/params_shard_147.bin new file mode 100644 index 0000000000000000000000000000000000000000..456ef9d352bf2f0dc74cc2bb4c9f7f3a8d96c294 --- /dev/null +++ b/params_shard_147.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aeae5ccbd360a14c4b7e22608cf4eb9d1206a5e980a7459505571d9604c2147 +size 33554432 diff --git a/params_shard_148.bin b/params_shard_148.bin new file mode 100644 index 0000000000000000000000000000000000000000..2922fdd12a4d85967da916eae357b984fbf8010a --- /dev/null +++ b/params_shard_148.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3abdfe6bb895c5f06eacba91d132ff24a2e928bf4213cc96f84f05ac15c37938 +size 100663296 diff --git a/params_shard_149.bin b/params_shard_149.bin new file mode 100644 index 0000000000000000000000000000000000000000..91be22bdc261d8bb0c526e4167cfdb0e36396d78 --- /dev/null +++ b/params_shard_149.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ecd8179ee315f8084b65490aff86e3d52e85be67206a5443c2cfea7715bd450 +size 28311552 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..533daa6e9c09536651a3c5d60c8c2d4e7f0c6e80 --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c536154354a98b6261cf64da94356cdf5f70096c0e8811530c6e6074caa87aa +size 92274688 diff --git a/params_shard_150.bin b/params_shard_150.bin new file mode 100644 index 0000000000000000000000000000000000000000..2806b179535951de902d9adcf7e6dfdba15e297c --- /dev/null +++ b/params_shard_150.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b9477c5e49725cdcd332f1aac9be676fce308ec31102162059286ae1bf55fd +size 33554432 diff --git a/params_shard_151.bin b/params_shard_151.bin new file mode 100644 index 0000000000000000000000000000000000000000..81ac085a56cbb35405f1f41581c77411e6f158c4 --- /dev/null +++ b/params_shard_151.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c289b518bead76ddd010998de442933c78fb21e9d49d75d833aa800ecc1ae0 +size 92274688 diff --git a/params_shard_152.bin b/params_shard_152.bin new file mode 100644 index 0000000000000000000000000000000000000000..564db9ecb6773fb24cb70f070bcb32df0fa3e28b --- /dev/null +++ b/params_shard_152.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1953f9c071ecc4a55cfd5b6005d1192ef629ffa14441069b04c4721121d6476b +size 92274688 diff --git a/params_shard_153.bin b/params_shard_153.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8bf1abe71aa306427e9b1826573618c329347a9 --- /dev/null +++ b/params_shard_153.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e7e3f075ffa2d4c82ee815f17e0a1b5b058dc204f6cc63993017d560e14c26 +size 28327936 diff --git a/params_shard_154.bin b/params_shard_154.bin new file mode 100644 index 0000000000000000000000000000000000000000..4d0908b1c98f89eb5aa2b644c8710bc66ce97397 --- /dev/null +++ b/params_shard_154.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:998a5768c327baf6f54d5244627373f03f23aff2fec22ce770b4286e4300cc92 +size 92274688 diff --git a/params_shard_155.bin b/params_shard_155.bin new file mode 100644 index 0000000000000000000000000000000000000000..3b40fbd1f626a19a009a831f6ea832674c82626c --- /dev/null +++ b/params_shard_155.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c9d459405d97822230a2dc82787086c2ef9eb7834494663b894f932137baf7 +size 92274688 diff --git a/params_shard_156.bin b/params_shard_156.bin new file mode 100644 index 0000000000000000000000000000000000000000..b0dec1d25204a30d2b3c8f3b0f21c2b4364be4b9 --- /dev/null +++ b/params_shard_156.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:687a667f65b0b29bf1644e1c8967181b20e0eaebc0e2497b82d84752d2202219 +size 23085056 diff --git a/params_shard_157.bin b/params_shard_157.bin new file mode 100644 index 0000000000000000000000000000000000000000..2dac7d48a0945545792a58899169e07cf2f813ae --- /dev/null +++ b/params_shard_157.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d656a48d3b86eea65e02b5ccceb28ee19fa277f64ffc1a390e9d4021b78298 +size 92274688 diff --git a/params_shard_158.bin b/params_shard_158.bin new file mode 100644 index 0000000000000000000000000000000000000000..82680b9c9c5f1d9db489426d9b4dd5f05b3e39ca --- /dev/null +++ b/params_shard_158.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c47c921c1844856e20e1a0f8ee48bfaadd92344505a770d09329f10b2725bef +size 92274688 diff --git a/params_shard_159.bin b/params_shard_159.bin new file mode 100644 index 0000000000000000000000000000000000000000..9a8ef85a945409d905b249a69486ea79481bd0db --- /dev/null +++ b/params_shard_159.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ff9ed239131372aaf92494c46e4009a520f9f88823d7a097b2c6d92c673b997 +size 23068672 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..af9b1b2fd22e1feefced208696306b9d0ad39b42 --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94c0f3799bbc22c02b8cd528104eea3b44ff024d585019e299cd238e7584b97b +size 28327936 diff --git a/params_shard_160.bin b/params_shard_160.bin new file mode 100644 index 0000000000000000000000000000000000000000..23fdad5b276b51c8d9b211543cd387ae8cc8a80a --- /dev/null +++ b/params_shard_160.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc7744944ca25b315796a768cd61e01ab2d6976e1148ea5e81201142454deba8 +size 100663296 diff --git a/params_shard_161.bin b/params_shard_161.bin new file mode 100644 index 0000000000000000000000000000000000000000..e0620ee1571935da4e4c7d11114c9155c66aa0e0 --- /dev/null +++ b/params_shard_161.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e45e8e48a67725c6b20bb20e2a60dbc704c66192eb27e7ce776e95f18c25161 +size 33554432 diff --git a/params_shard_162.bin b/params_shard_162.bin new file mode 100644 index 0000000000000000000000000000000000000000..4fc71e6708b97e68aec21adcd4216c2f7a87f445 --- /dev/null +++ b/params_shard_162.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:539b536e594584e4d11b8be4ac74711044d1278d5b34233cfa6c189d4ea004a9 +size 92274688 diff --git a/params_shard_163.bin b/params_shard_163.bin new file mode 100644 index 0000000000000000000000000000000000000000..3d659262c986ab745d622d0fbe1751b66af6a5e3 --- /dev/null +++ b/params_shard_163.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52a316a3dcaed27a60243e87f20a32d69ba8d51f7892620eeb28d98b0c8308ab +size 28327936 diff --git a/params_shard_164.bin b/params_shard_164.bin new file mode 100644 index 0000000000000000000000000000000000000000..08d8ad32efcda3e73c1bed9175606c4ea04fc4a7 --- /dev/null +++ b/params_shard_164.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:065be81a61c48aef19c6a4532685933932ceddc2ad1e11fb927767d07d1d6938 +size 92274688 diff --git a/params_shard_165.bin b/params_shard_165.bin new file mode 100644 index 0000000000000000000000000000000000000000..f40f548fa7e0f6228b9b39471c6ed0061a51a1c2 --- /dev/null +++ b/params_shard_165.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd7893f5b31f1ff7b5d2979e7a1f38c5c18d83dc0df4c826d08ac6162e1f177f +size 92274688 diff --git a/params_shard_166.bin b/params_shard_166.bin new file mode 100644 index 0000000000000000000000000000000000000000..8522d4b14f6f70ffb7946d9f8a028e7c1e8e536d --- /dev/null +++ b/params_shard_166.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e79115a875a9c75ba16816357ca0347ea4d442ca5defffbe2454ce4a08780b55 +size 23068672 diff --git a/params_shard_167.bin b/params_shard_167.bin new file mode 100644 index 0000000000000000000000000000000000000000..7df45afd792cb70c9199fc40aa25b0bd0b53e84e --- /dev/null +++ b/params_shard_167.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0f1d365f555182ee8acef4b195d2096e8687992d65e2c4428e0fb13ccb59a51 +size 100663296 diff --git a/params_shard_168.bin b/params_shard_168.bin new file mode 100644 index 0000000000000000000000000000000000000000..31d0e8fb46e455e58ab313ffc5ab1abfa4085aa9 --- /dev/null +++ b/params_shard_168.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af17e864b15e0ea5071a6b78e35a1bde2d4ffad185274664ac4dbfe74a3f346d +size 33554432 diff --git a/params_shard_169.bin b/params_shard_169.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7c4ae8031c141f721379aabd8ad177e55df3ccf --- /dev/null +++ b/params_shard_169.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85021300a243f0c30ebdb062efeb2fabf5f063152d6503c58e39353276119c7a +size 100663296 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..684772bde4fcb5125e9d73a83f3fc9f108224036 --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4df5c2d7e06f3514554541ce2943d549d65e433f007a8aa1c76999cdf2ae69ce +size 92274688 diff --git a/params_shard_170.bin b/params_shard_170.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee2259db8dcecdabbd9a610af9d9bf49f96bb047 --- /dev/null +++ b/params_shard_170.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0cc43907370dbdf786f8f6a7f73cbe8b2cae8be2f4873a544e83b5f2e863f2e +size 28311552 diff --git a/params_shard_171.bin b/params_shard_171.bin new file mode 100644 index 0000000000000000000000000000000000000000..72f9fcaf9a7effcb6524472fee39a5f61f7e1e16 --- /dev/null +++ b/params_shard_171.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f718253ea1021c8b0dbe7cc2aff58144f3261faf9569243a9693ba81d153c326 +size 33554432 diff --git a/params_shard_172.bin b/params_shard_172.bin new file mode 100644 index 0000000000000000000000000000000000000000..478081dcdcac4c85dfe9af2bf345786675dd7fca --- /dev/null +++ b/params_shard_172.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8858a37f435aee5b7dd0139c77343f0b6204bca5d662caeb2ea8fd0638f8d61a +size 92274688 diff --git a/params_shard_173.bin b/params_shard_173.bin new file mode 100644 index 0000000000000000000000000000000000000000..e071bb3453b770c3221143a12a5d5c073f913045 --- /dev/null +++ b/params_shard_173.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac7feb54ca379c54b5c55e0cee3eec9a9eb82855c9082b76d77a813709bff7d +size 92274688 diff --git a/params_shard_174.bin b/params_shard_174.bin new file mode 100644 index 0000000000000000000000000000000000000000..0d5a62a0a9fd77d6123df1bd3b7a117dc57d0558 --- /dev/null +++ b/params_shard_174.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeec47a614c79d86b513d5ce6aedaa2b9fb8392e8e95940a8e6b1ef5255d3376 +size 28327936 diff --git a/params_shard_175.bin b/params_shard_175.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb960bd0db5d478277f2d715276d8781c5a32a7f --- /dev/null +++ b/params_shard_175.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:295a0b86aee601c83264ba543a848e7f9e757fd6969d9dd24d836b279ef2ad84 +size 92274688 diff --git a/params_shard_176.bin b/params_shard_176.bin new file mode 100644 index 0000000000000000000000000000000000000000..7fa9c6072cfa6fa7f14a562c4738f4f39fb4719d --- /dev/null +++ b/params_shard_176.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d2df75ab9b88b0864781790f44a94133d3bf173f5ac6a9803e23b14b244b476 +size 92274688 diff --git a/params_shard_177.bin b/params_shard_177.bin new file mode 100644 index 0000000000000000000000000000000000000000..19c24fbd23167e49e886ea0bcaa2f114c6afbe17 --- /dev/null +++ b/params_shard_177.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac3f833a751501e0466d00d46a3d0beb382d61d44180ff28fb5eaad20e51c67 +size 23085056 diff --git a/params_shard_178.bin b/params_shard_178.bin new file mode 100644 index 0000000000000000000000000000000000000000..85aad2cfbbd096fc6662dfb5cce43302a74aab26 --- /dev/null +++ b/params_shard_178.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc76b089e3c018fe8a2263e9e8084082f6b5f56c3efcdf4a5945889c6af9436b +size 92274688 diff --git a/params_shard_179.bin b/params_shard_179.bin new file mode 100644 index 0000000000000000000000000000000000000000..83aeca951d18755dc16a2aaf1d3a5b2f9bfc9199 --- /dev/null +++ b/params_shard_179.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d451d0700c9efa2b1e158fd284e1ffc8a7e433eef5978442641ddce9a1bb117 +size 92274688 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..b746a5d6c43518acef4028f4b6985ba08284d4a8 --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ad8cf7240a9a2e3aa23efce159210fc369b0b927c67ea12fc8f717901dec4c3 +size 92274688 diff --git a/params_shard_180.bin b/params_shard_180.bin new file mode 100644 index 0000000000000000000000000000000000000000..d84d1e60f84994c529c06146ca9fd096ec1e240c --- /dev/null +++ b/params_shard_180.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47452af0a47c8bc5418a7b8c4446ab773a1591046b1d92ba93dc213c47cd8989 +size 23068672 diff --git a/params_shard_181.bin b/params_shard_181.bin new file mode 100644 index 0000000000000000000000000000000000000000..61ff5244cc5f84827b18f2a3325e8a6864eed531 --- /dev/null +++ b/params_shard_181.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a63df0a3b73f012c22549385ab7333d6b8b6992611559273bc97ea4b7c5268c5 +size 100663296 diff --git a/params_shard_182.bin b/params_shard_182.bin new file mode 100644 index 0000000000000000000000000000000000000000..efca55aedeb80c58e7d6a84ff8f37a200c0b6cb8 --- /dev/null +++ b/params_shard_182.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba15b8e0c1ddf213a227e5abdd46fa75156f1f0782d1933afd0d858016bd94ff +size 33554432 diff --git a/params_shard_183.bin b/params_shard_183.bin new file mode 100644 index 0000000000000000000000000000000000000000..a9e18b7e5ecf1e479600e281ab74a1765496d488 --- /dev/null +++ b/params_shard_183.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9678c084415f6a87db7346d5bf5156633f1dbc9a01dcd1cc11c5b56eae9bb5f +size 92274688 diff --git a/params_shard_184.bin b/params_shard_184.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f4d85ec1a1926dda6cac38a24b412d22836d076 --- /dev/null +++ b/params_shard_184.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9d36db9fcdfa3c3e13354b625ce7e7cb8cfa435a7b2f7b16a718dfc1d360d8f +size 28327936 diff --git a/params_shard_185.bin b/params_shard_185.bin new file mode 100644 index 0000000000000000000000000000000000000000..90fba6c905d55c5bcf4c28de729272026ccecb54 --- /dev/null +++ b/params_shard_185.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f86755b660923bb89691eca62b8d09521795816d7ea2c29e03b156f84f7a950a +size 92274688 diff --git a/params_shard_186.bin b/params_shard_186.bin new file mode 100644 index 0000000000000000000000000000000000000000..883b549b64f0fa57099562e328c6abfb02123163 --- /dev/null +++ b/params_shard_186.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a85bf408a69e0288131fdb2404713fa855849b76b1ad8071a014468e38d9f5 +size 92274688 diff --git a/params_shard_187.bin b/params_shard_187.bin new file mode 100644 index 0000000000000000000000000000000000000000..c6637dd54316c4042777bd162aa6a56c7c69dd7d --- /dev/null +++ b/params_shard_187.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed340a63938eeafec8c13a1fcb4990db6604e7753ced40fbf83f9612e8eae344 +size 23068672 diff --git a/params_shard_188.bin b/params_shard_188.bin new file mode 100644 index 0000000000000000000000000000000000000000..5bd99922e7726f657851661bb0929a23199a90af --- /dev/null +++ b/params_shard_188.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2605f5e8602d3223e0abec0d2a7c8f1565b7278d0c0575402679cbc8e314f6b7 +size 100663296 diff --git a/params_shard_189.bin b/params_shard_189.bin new file mode 100644 index 0000000000000000000000000000000000000000..c6fca4727b8d94cdd9c7f3284a2282777ac58309 --- /dev/null +++ b/params_shard_189.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e358b2f1a2945a1901eb86d9e6be5a40987c9c82daaeb41bae6401c0ac65364c +size 33554432 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba57bb8f957c39feb133907ed31cf5b5f22be392 --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:914f1cb2ea3afb3e4537dd8a8defe54341f315e1fc7402f020ade99f9b2e9c2f +size 23068672 diff --git a/params_shard_190.bin b/params_shard_190.bin new file mode 100644 index 0000000000000000000000000000000000000000..a5b75e83facfcf9d98f03073685f11be292c77e5 --- /dev/null +++ b/params_shard_190.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08c591c447c2b402c9dbc2db58638b0bb8860c387ed26079dfba98118952987 +size 100663296 diff --git a/params_shard_191.bin b/params_shard_191.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f20f6fd8e00fd73626f9680f3d3a5f6d19d2f8d --- /dev/null +++ b/params_shard_191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee84921492478f39689cae7c0f411b08604cbeae35e8760ab358de0137bc3414 +size 28311552 diff --git a/params_shard_192.bin b/params_shard_192.bin new file mode 100644 index 0000000000000000000000000000000000000000..2790279296dd3f0bb0744974a845ddfb4f659f61 --- /dev/null +++ b/params_shard_192.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19776b1a811ee2157df4377593cdecdf0040236b8c37445785bff2a053dacc9d +size 33554432 diff --git a/params_shard_193.bin b/params_shard_193.bin new file mode 100644 index 0000000000000000000000000000000000000000..57da0c5a4ca7ea63065c93c97453d164dc9d28d7 --- /dev/null +++ b/params_shard_193.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2240cd392f1894f9eefc26f4bd372b79946c6fec8c55a21ec04313e69ad19722 +size 92274688 diff --git a/params_shard_194.bin b/params_shard_194.bin new file mode 100644 index 0000000000000000000000000000000000000000..02c598b8ad883c814f5300052cc8092c644cde45 --- /dev/null +++ b/params_shard_194.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6db72cb190de1fd82165dd0a80698b1db9b7acada586ccdf791449573530bc2 +size 92274688 diff --git a/params_shard_195.bin b/params_shard_195.bin new file mode 100644 index 0000000000000000000000000000000000000000..d8a5220d176de90196e1fff26dbc12f799d7132a --- /dev/null +++ b/params_shard_195.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b50305f03efdbc45d582b394bce85da3af43738eea60484c9aba5c7dcaad742b +size 28327936 diff --git a/params_shard_196.bin b/params_shard_196.bin new file mode 100644 index 0000000000000000000000000000000000000000..5bc1b704c08d6bd1cf7a4e500e051c294800950a --- /dev/null +++ b/params_shard_196.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0884695a63cf85908e9d4b2a04fca146746240a5f4816aa129f36ad28cb8920d +size 92274688 diff --git a/params_shard_197.bin b/params_shard_197.bin new file mode 100644 index 0000000000000000000000000000000000000000..34b12670ac5a3ec0140765e9f5535b3a06b5be3a --- /dev/null +++ b/params_shard_197.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:585ed5276efde7a2aa42ba450cf0efbd7912b1674b8817f3a8098015b10a15ce +size 92274688 diff --git a/params_shard_198.bin b/params_shard_198.bin new file mode 100644 index 0000000000000000000000000000000000000000..1bf1a6e6d7472ed236428bda65c59efbd348956b --- /dev/null +++ b/params_shard_198.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7fa4688c5dbaff38e8bc1c38b7c522247b3dc48974ca432b35c59bb87b11f8d +size 23085056 diff --git a/params_shard_199.bin b/params_shard_199.bin new file mode 100644 index 0000000000000000000000000000000000000000..fbeadf0f062bd5b3621500bea1ff0b92deb3491d --- /dev/null +++ b/params_shard_199.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620d9f70c288d9950ba7eccdc29d3ac0c230574d911b31104ca94a561cec079e +size 92274688 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..0405c1c1f7f2e56916d95143d058f624ffee0377 --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32736aee39481c7d41fb49bb97f6c03cacb5d42c557bcaee6e644a51e30075dc +size 100663296 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..c01c2c07c0e31ecbbe443a677729a4a0c03c0700 --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e1a68fbaa9fc7df62703a4d1090755a999be25afbf4b04e32976efef9723eb +size 100663296 diff --git a/params_shard_200.bin b/params_shard_200.bin new file mode 100644 index 0000000000000000000000000000000000000000..4ca202c800f0a2b28e31cdc52057035ca7ae89c3 --- /dev/null +++ b/params_shard_200.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15e7180c4ce3029505cf08b88a1b9539437567fce605eca0c43e59e0665a585 +size 92274688 diff --git a/params_shard_201.bin b/params_shard_201.bin new file mode 100644 index 0000000000000000000000000000000000000000..c6aeab70b93ef7d4315addbc09dde13da1ffa106 --- /dev/null +++ b/params_shard_201.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1249648d097759b2584687bb0a6b7b20c74f28041422831ea1e64f93b15008bc +size 23068672 diff --git a/params_shard_202.bin b/params_shard_202.bin new file mode 100644 index 0000000000000000000000000000000000000000..daf649d3ce9cae6cb710e71fb0923201fec76e9e --- /dev/null +++ b/params_shard_202.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8f04ecce9b0491115d332060efd76ed0d87a147da7926c9fe863df6ebe6e311 +size 100663296 diff --git a/params_shard_203.bin b/params_shard_203.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e80cc6be1c73b9b4805192304c98d7e37df0399 --- /dev/null +++ b/params_shard_203.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a397eba69ff04b60507e2f4804991bf7b93948a39eb519d86e39485e98d00956 +size 33554432 diff --git a/params_shard_204.bin b/params_shard_204.bin new file mode 100644 index 0000000000000000000000000000000000000000..9f4521b7d676bb671271b11e5f11250730bb7bf8 --- /dev/null +++ b/params_shard_204.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d462fd40a6884fb091f55c78c77413ef8cbc35999be7fac14b4bef9bab86b23 +size 92274688 diff --git a/params_shard_205.bin b/params_shard_205.bin new file mode 100644 index 0000000000000000000000000000000000000000..27bb66457b32a7ea81db9ee28677fb4e6083412a --- /dev/null +++ b/params_shard_205.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75cd4299c80ff2677c1e3f6395c6736549888cb1e501b2c0d2f0b1fc2a97e6cd +size 28327936 diff --git a/params_shard_206.bin b/params_shard_206.bin new file mode 100644 index 0000000000000000000000000000000000000000..bcec3e41f894aa9d5d8da923db05acc6755003a0 --- /dev/null +++ b/params_shard_206.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebea3ae4b6626ae3d590e777b55e8c58b114f40a859f15fd20cd70bc83cfb450 +size 92274688 diff --git a/params_shard_207.bin b/params_shard_207.bin new file mode 100644 index 0000000000000000000000000000000000000000..bb46e9c8c89d940fcfad2d829650c4ae20c34cb2 --- /dev/null +++ b/params_shard_207.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:608eae0d8ddd6072721db259ab9cfce0e731331605e887dcd329fcb899215073 +size 92274688 diff --git a/params_shard_208.bin b/params_shard_208.bin new file mode 100644 index 0000000000000000000000000000000000000000..481b094b98e2d9de23f115cdbbf48d6e408cd8a1 --- /dev/null +++ b/params_shard_208.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b57bc2f74a56c837a95178f932d0f6e856d92c45b403d12050cca9ff52133a +size 23068672 diff --git a/params_shard_209.bin b/params_shard_209.bin new file mode 100644 index 0000000000000000000000000000000000000000..8672f7591acdd184890554ecdb084a6dff6ff724 --- /dev/null +++ b/params_shard_209.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bc83bd518d38903e6914d2e6f5e5280733715bfd3d54355e62072e2c68f5c6f +size 100663296 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..18c1578bc2ef5c578ced54a8f2cfd2be5b72a47c --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6051f1e0eb7691aed1777780cb513769d03dab8e8374dc8fb9f7e54bf826097 +size 33554432 diff --git a/params_shard_210.bin b/params_shard_210.bin new file mode 100644 index 0000000000000000000000000000000000000000..6d44a331b78e18935d99199ae362942e1a19b64f --- /dev/null +++ b/params_shard_210.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4871a22c0b4c90d54f7ca7ac82176d9cf6fce77760d478f0654b792fafc9d8b +size 33554432 diff --git a/params_shard_211.bin b/params_shard_211.bin new file mode 100644 index 0000000000000000000000000000000000000000..8374283852098a29f195f1ffec8b6c79928aa187 --- /dev/null +++ b/params_shard_211.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f3996a9735f67991f9e796e003339769c187e202fda7182d5942bc14bac696 +size 100663296 diff --git a/params_shard_212.bin b/params_shard_212.bin new file mode 100644 index 0000000000000000000000000000000000000000..2582ed39c86a2ff4cbc218efb817282a6c660a49 --- /dev/null +++ b/params_shard_212.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5b4ece926c7d8f5b8f7916a16655118147baf462f2d906b64593a75608327f1 +size 28311552 diff --git a/params_shard_213.bin b/params_shard_213.bin new file mode 100644 index 0000000000000000000000000000000000000000..47a737946809209c261d4ab1397d90b8b9ffe9a3 --- /dev/null +++ b/params_shard_213.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b0e19504c745eaa6991e7c74f329d54b294de2f5f001bf26efba2ba00002c93 +size 33554432 diff --git a/params_shard_214.bin b/params_shard_214.bin new file mode 100644 index 0000000000000000000000000000000000000000..09d4f1140fa3b768b3b4c0aba48556a8c2ba1069 --- /dev/null +++ b/params_shard_214.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ca09f1dec386afede732cb0ac0ea606ea1b1e45f83e0201693867ed088dc794 +size 92274688 diff --git a/params_shard_215.bin b/params_shard_215.bin new file mode 100644 index 0000000000000000000000000000000000000000..4017a15c56e579bf48d65697fee02915d10f556e --- /dev/null +++ b/params_shard_215.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a97f2030a3b87296847d1b3db2995cac87ae06c0af0908b1f48ff358688b1cd9 +size 92274688 diff --git a/params_shard_216.bin b/params_shard_216.bin new file mode 100644 index 0000000000000000000000000000000000000000..e274213e6db609d5d76701a0a322c63459aadb66 --- /dev/null +++ b/params_shard_216.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb17a2498837799dc40d27a9847b332befc535c665580d8b753e9cce43cbf152 +size 28327936 diff --git a/params_shard_217.bin b/params_shard_217.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2e5a2f9e615f2c767ebb0aa7462d16f30f16ac1 --- /dev/null +++ b/params_shard_217.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1a8b5efe4bd68b5ad909fc03f8047f2e146be60ff9852eb1d7ea1c5cc204453 +size 92274688 diff --git a/params_shard_218.bin b/params_shard_218.bin new file mode 100644 index 0000000000000000000000000000000000000000..e886c2f37898a9861174d4f473d6cc34cdd836fd --- /dev/null +++ b/params_shard_218.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc5a82af831a67f12bcb2640b5bd08fcde05b9261f69998e0dfb60cda9ed562 +size 92274688 diff --git a/params_shard_219.bin b/params_shard_219.bin new file mode 100644 index 0000000000000000000000000000000000000000..4df479e0f0c561b41f0d5cc9369608c5cb8598cb --- /dev/null +++ b/params_shard_219.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6698129873ba069c4f6aa89d1ff897d622a8d953fc395a37c1541e8b2b77a3ce +size 23085056 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..a46c427db4dfa705da7d35e9785dce3097effd41 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a31a1f4c2dcf9c5ee75dfec2c57131d119e946a638a047fa7063c1b2f8e093 +size 100663296 diff --git a/params_shard_220.bin b/params_shard_220.bin new file mode 100644 index 0000000000000000000000000000000000000000..bfff8558e03e598ad98cbdf45a8e17e0b9580ad3 --- /dev/null +++ b/params_shard_220.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a6c6c84c7d167999b1e97648f6cf2a3be309ea450675cb08d5d89f8b8176d9f +size 92274688 diff --git a/params_shard_221.bin b/params_shard_221.bin new file mode 100644 index 0000000000000000000000000000000000000000..4de8031c19b6bab40b91e7ea8e91276a1b328a6a --- /dev/null +++ b/params_shard_221.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fbacf2303640881b3fb13b8e176668f59e9560b1332677674d2f29aebfe3fba +size 92274688 diff --git a/params_shard_222.bin b/params_shard_222.bin new file mode 100644 index 0000000000000000000000000000000000000000..0c05e5e8033407c239a2f8b4f48a92499e3e7e10 --- /dev/null +++ b/params_shard_222.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2df40c9b30c1cf883f66fa0d7c9536299a9ee5929d1ccbeee6654db97e65ef0 +size 23068672 diff --git a/params_shard_223.bin b/params_shard_223.bin new file mode 100644 index 0000000000000000000000000000000000000000..2d014baae518cd7475cbffaaa6d5f9551ac517d4 --- /dev/null +++ b/params_shard_223.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b343cc9a844d5381f518b2dfbaee8aa5fa7cd36de5089b69ad1b65bdab7dc447 +size 100663296 diff --git a/params_shard_224.bin b/params_shard_224.bin new file mode 100644 index 0000000000000000000000000000000000000000..47b1324429ec7d679ff26c73362984a0613eda1f --- /dev/null +++ b/params_shard_224.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5894c7152683f48b8d6443a60d35d65897299a81535b10d2a5ca74c94e5101bb +size 33554432 diff --git a/params_shard_225.bin b/params_shard_225.bin new file mode 100644 index 0000000000000000000000000000000000000000..a1337095d9883ce5934146b2a63d91077b4bbbbf --- /dev/null +++ b/params_shard_225.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5a24123706fd51ec2e635179c956959abf356b49165fcf8c7959082f5b53a2b +size 92274688 diff --git a/params_shard_226.bin b/params_shard_226.bin new file mode 100644 index 0000000000000000000000000000000000000000..f737ec58f309f04253e26d438f9eb77a1ed2d9ce --- /dev/null +++ b/params_shard_226.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:735ba6373f64495d1272f84ffd2d67a1be01b0ed29bb67e490d42d7bec848c71 +size 28327936 diff --git a/params_shard_227.bin b/params_shard_227.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c5370ddfe044396173541a14fbdff173f4dcc5a --- /dev/null +++ b/params_shard_227.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:674c181f849356fa4cd96ef50b46423e2ce01a5dd51d48fdbbf367f41e861e78 +size 92274688 diff --git a/params_shard_228.bin b/params_shard_228.bin new file mode 100644 index 0000000000000000000000000000000000000000..694c41061a6796cac5190f490ac7683f0b5dd4c1 --- /dev/null +++ b/params_shard_228.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2980a5524833adf6bea892502e86b451fd8a6d2365967e3e49fb49bf617ec968 +size 92274688 diff --git a/params_shard_229.bin b/params_shard_229.bin new file mode 100644 index 0000000000000000000000000000000000000000..379b1fc7fb5cc8df1b0d9913c1ddc2ff271bcee6 --- /dev/null +++ b/params_shard_229.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72002de17f5f7ab9c4aa2567e1a08c024e72e24c7be2000a17ce030bd87d48fe +size 23068672 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..8babbb34f4f46167e99223965839dacbf84cb20a --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb618effc2e0bbe3c47172a4280cbf4525bf0002f7d7ee1b7db32e0ccf341efe +size 28311552 diff --git a/params_shard_230.bin b/params_shard_230.bin new file mode 100644 index 0000000000000000000000000000000000000000..b4f4a6c23db49a99909ae4d6619c7f674d70006c --- /dev/null +++ b/params_shard_230.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:649349ae48be4d175dc234d2bad75853c26d7c22faf91a4c8b16c0227fab7e58 +size 100663296 diff --git a/params_shard_231.bin b/params_shard_231.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1bc1cbcfe54d63f6f0f0914bc78efbe33572d52 --- /dev/null +++ b/params_shard_231.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bed01446f78d992c10634b1bcb4b233e61313cc6c0834b5f2e3cd304ffff630c +size 33554432 diff --git a/params_shard_232.bin b/params_shard_232.bin new file mode 100644 index 0000000000000000000000000000000000000000..90dba095f35680c0840a2396ca5475ab8da6cbe9 --- /dev/null +++ b/params_shard_232.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f18612fe3c2a678207b78f876369494a749560d4d7f3628be5338b4c527b14c +size 100663296 diff --git a/params_shard_233.bin b/params_shard_233.bin new file mode 100644 index 0000000000000000000000000000000000000000..9a17bf50908004bf71d9e27699fa3fae71f413f2 --- /dev/null +++ b/params_shard_233.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29277aac52fdec85a7f9019ec80e28e31f8b7736ec1aeb256af1143df3cb7eda +size 28311552 diff --git a/params_shard_234.bin b/params_shard_234.bin new file mode 100644 index 0000000000000000000000000000000000000000..d192467933f00229dc0047468f1a6bee35371155 --- /dev/null +++ b/params_shard_234.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ea70930951e47764da6cc622407d9ebf305649a94debe500bcd6a3776e25c21 +size 33554432 diff --git a/params_shard_235.bin b/params_shard_235.bin new file mode 100644 index 0000000000000000000000000000000000000000..f08e1369d49a939d656a136588d04e3f12499cbe --- /dev/null +++ b/params_shard_235.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb24d3d484bfac0f8a3c323d31ccd94e24479e75c4b647de9a02b71f96c126bb +size 92274688 diff --git a/params_shard_236.bin b/params_shard_236.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ee17078cbdbf38768d5bae3723c356145cb470b --- /dev/null +++ b/params_shard_236.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10448260250d5363b0902358ada840ad83c610e53ca746125b03ba8d87088479 +size 92274688 diff --git a/params_shard_237.bin b/params_shard_237.bin new file mode 100644 index 0000000000000000000000000000000000000000..caddd57ee7a5b42017d9588c74d291437c3e60c7 --- /dev/null +++ b/params_shard_237.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909c96fe53d39b5f3cba28845c971ce7a83f7d481869337c1e6f65cb07b658ce +size 28327936 diff --git a/params_shard_238.bin b/params_shard_238.bin new file mode 100644 index 0000000000000000000000000000000000000000..208cb9bdf73c97f985ac173ef37f0e878082f046 --- /dev/null +++ b/params_shard_238.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28eae00f7b40a0dcf9a890e26297d15adbedde57ba70f12470a6e824c4238466 +size 92274688 diff --git a/params_shard_239.bin b/params_shard_239.bin new file mode 100644 index 0000000000000000000000000000000000000000..1693e9b98b610bf71266c6d90388bd5f97aaf582 --- /dev/null +++ b/params_shard_239.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b12930117a49b40313f9fdcbaee75898e039b3bf076ea6c1d57068b9732de531 +size 92274688 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..bca526931abfbaccde0bfbdb0ee232a2f21643d6 --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f828b46fb29adcf1d5b17ad68975a0c4123f53bbe3c4d04698eafa57eb45e28 +size 33554432 diff --git a/params_shard_240.bin b/params_shard_240.bin new file mode 100644 index 0000000000000000000000000000000000000000..16d81546bdf6e5c37b7a469bb83d9f7e25550875 --- /dev/null +++ b/params_shard_240.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd337fcbba357eacb8041a88b0f6a9a2c800b9d7fb66d6e11ef07d295284ebb5 +size 23085056 diff --git a/params_shard_241.bin b/params_shard_241.bin new file mode 100644 index 0000000000000000000000000000000000000000..716c9d4a8aa4960e4badff1ea437a8d48258fa4a --- /dev/null +++ b/params_shard_241.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cc9de41cbd1cb0250336a57fbd496b9c094be2248604edef1591c35de5faa87 +size 92274688 diff --git a/params_shard_242.bin b/params_shard_242.bin new file mode 100644 index 0000000000000000000000000000000000000000..03758e7d91535f301773cde523c76482376a0899 --- /dev/null +++ b/params_shard_242.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9b715cdc51fbe7c7d98c6697607599e2353068aa074ffd807600d3159e40ba +size 92274688 diff --git a/params_shard_243.bin b/params_shard_243.bin new file mode 100644 index 0000000000000000000000000000000000000000..4be11c6579391f6f46e39278a21c809b4bd9bbe8 --- /dev/null +++ b/params_shard_243.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51441cf6146da76bbae85a82236f1b4e9d6b933ae0827e8957b31e8f75a8d99b +size 23068672 diff --git a/params_shard_244.bin b/params_shard_244.bin new file mode 100644 index 0000000000000000000000000000000000000000..8a13e76fedef43f5656c396b36b7a27efa99887a --- /dev/null +++ b/params_shard_244.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cdf1260a53470c9112ada64cca93ff3807aba734f37e41b34af527e6d717ad4 +size 100663296 diff --git a/params_shard_245.bin b/params_shard_245.bin new file mode 100644 index 0000000000000000000000000000000000000000..5a330cf34c44c972f507c05b145ff4fdc280db45 --- /dev/null +++ b/params_shard_245.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b43eebf061125acd7837d14d603b4948bc0b0ce6adb8f9b0e2da7d4c445f30e +size 33554432 diff --git a/params_shard_246.bin b/params_shard_246.bin new file mode 100644 index 0000000000000000000000000000000000000000..d87022379720dffc6f14759e323fbd696d7496a6 --- /dev/null +++ b/params_shard_246.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff1ba65217be090260b859c7996de9e7d602532385ad781001ebdb6c3ac7bf8 +size 92274688 diff --git a/params_shard_247.bin b/params_shard_247.bin new file mode 100644 index 0000000000000000000000000000000000000000..4ace62fc1b43ce53fb2d621660cdeee6bb82854b --- /dev/null +++ b/params_shard_247.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86cd1af675fa1e3aba25a95755500a033ba97404b28b1cfb1c4570e23a63288e +size 28327936 diff --git a/params_shard_248.bin b/params_shard_248.bin new file mode 100644 index 0000000000000000000000000000000000000000..70c8e2db3cfa84ad7d61279895bc1952d98cecc8 --- /dev/null +++ b/params_shard_248.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9716d900d749e527ba577286ebe30ee5872752db035f5e20dde9ed24813a440 +size 92274688 diff --git a/params_shard_249.bin b/params_shard_249.bin new file mode 100644 index 0000000000000000000000000000000000000000..9757aa769834f7218b45f88f5740da057c6e53d1 --- /dev/null +++ b/params_shard_249.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d1fc6f7b24a65f7807b3aeaf476b3e18c2f136356309c679f25480869f0d4fb +size 92274688 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..7b22ec026407c46943f87f47b04e920037f9add3 --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58aa36381e1327f4b5c617cd35cc7fb76017c5137d5cc7be567b6c9112e4cdec +size 92274688 diff --git a/params_shard_250.bin b/params_shard_250.bin new file mode 100644 index 0000000000000000000000000000000000000000..9df33001af4df88e4d5061f13a5afcde9584cb48 --- /dev/null +++ b/params_shard_250.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56eed04c17b30531c828c3bdfae77d9a6fe948ff636342dd3515a654985a6ef7 +size 23068672 diff --git a/params_shard_251.bin b/params_shard_251.bin new file mode 100644 index 0000000000000000000000000000000000000000..b1fa22b03813f4567606119e4ce93533b5a75622 --- /dev/null +++ b/params_shard_251.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b08af90ae76f4c9a385a348b3773152864cb2e05535d0c7a9c7a0a881d7fab0 +size 100663296 diff --git a/params_shard_252.bin b/params_shard_252.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1c9247790828dc9dc76c6f418d417a79b21fb2e --- /dev/null +++ b/params_shard_252.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20bbc8f9615540040bcd177330b16e44cf004d0a4eea4c76c23c36963920fbc1 +size 33554432 diff --git a/params_shard_253.bin b/params_shard_253.bin new file mode 100644 index 0000000000000000000000000000000000000000..2fd6a66db4ce45cf937d37cfd7680918e959056b --- /dev/null +++ b/params_shard_253.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c9f64e365e50035d3830cdb703679d959fbb3f3d2a3b3b20f7a6f3c764fc41d +size 100663296 diff --git a/params_shard_254.bin b/params_shard_254.bin new file mode 100644 index 0000000000000000000000000000000000000000..374636f74afcebdbca43e2dd456bcf791fa23fe8 --- /dev/null +++ b/params_shard_254.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1939ba64116c27e16a081810d532070621347ff5cf2ba867ff94b3288d2d9b64 +size 28311552 diff --git a/params_shard_255.bin b/params_shard_255.bin new file mode 100644 index 0000000000000000000000000000000000000000..a083fb1c2d1972d6b9ee59f03727e5ebafb28053 --- /dev/null +++ b/params_shard_255.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaf6bed243bf3baa929c37618e4b275a78719ff6bd9e76966221760e8bae769e +size 33554432 diff --git a/params_shard_256.bin b/params_shard_256.bin new file mode 100644 index 0000000000000000000000000000000000000000..72b0f969c8451c2acda597e06d4aa9dda4aa8859 --- /dev/null +++ b/params_shard_256.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09162e711d7e9454e34b47b77b5979cbc36d7a63b7e9b3e73ddac7aa06a59f65 +size 92274688 diff --git a/params_shard_257.bin b/params_shard_257.bin new file mode 100644 index 0000000000000000000000000000000000000000..28556e889d1bc74643038c203c05e26c0d67b398 --- /dev/null +++ b/params_shard_257.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d69bf01a3d41e33cf13a1a0c4f3e720689f27bb37579b97b6acfc0fe494e57 +size 92274688 diff --git a/params_shard_258.bin b/params_shard_258.bin new file mode 100644 index 0000000000000000000000000000000000000000..519529baceea5d743b9d174073dd886da775f078 --- /dev/null +++ b/params_shard_258.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8006c225e991975366dc6480a324187425731c25b1b574f74df53f9298459c0 +size 28327936 diff --git a/params_shard_259.bin b/params_shard_259.bin new file mode 100644 index 0000000000000000000000000000000000000000..b36aa36619f6dd2d41238956d064f7269e42101d --- /dev/null +++ b/params_shard_259.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70cde0cb6552d9bea8ebcfd60c0fd45c381676dd3e44ce5acebf66e31416dcb3 +size 92274688 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..01693f2abc703e0119643004eb160030bdd75b50 --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7526e5e4479d7b103f517770accdae2e797109b7dd91f2a0fb3502af8a09a0c +size 92274688 diff --git a/params_shard_260.bin b/params_shard_260.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a5d2818da938918de0092154f698986600d936e --- /dev/null +++ b/params_shard_260.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:900c9ffea8a9de6446d83fc045803b0c0797bb28412f14f86d075f62d0a8d3f1 +size 92274688 diff --git a/params_shard_261.bin b/params_shard_261.bin new file mode 100644 index 0000000000000000000000000000000000000000..e0c4800c52cbc28046fda6c39732c9a65ee94b33 --- /dev/null +++ b/params_shard_261.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7a3060d229cd223a97406332b39c0e81696285013c6e2630043c4d3c2eee5c0 +size 23101440 diff --git a/params_shard_262.bin b/params_shard_262.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a0fcad40f87ad8f5386c4f737edf5f05de148f2 --- /dev/null +++ b/params_shard_262.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb6ac0ea0e4c7938d8f56c8ff8b6be41ad53f5a178ff9a3403604d034edee227 +size 92274688 diff --git a/params_shard_263.bin b/params_shard_263.bin new file mode 100644 index 0000000000000000000000000000000000000000..a6e2c3e99d422697c68696c03e7028053c152b6f --- /dev/null +++ b/params_shard_263.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af85ad7744f95cd4b813be37aff03051932af4a80b6191fb49cad9cc186b6117 +size 92274688 diff --git a/params_shard_264.bin b/params_shard_264.bin new file mode 100644 index 0000000000000000000000000000000000000000..a06b108b2f398b38362f33c0849b6199b5429bc8 --- /dev/null +++ b/params_shard_264.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b57862f2a1c07c2fdb8ae1a948a71fcdbb9cd384899597d2d7bb99f6f94aba75 +size 23068672 diff --git a/params_shard_265.bin b/params_shard_265.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2ca565550697d5953cbf7139e4184cb7ed291bb --- /dev/null +++ b/params_shard_265.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134791a1ad1ddd9c77557c79f35ee3a304e526180c175317b2d3f4a67b53f78e +size 92274688 diff --git a/params_shard_266.bin b/params_shard_266.bin new file mode 100644 index 0000000000000000000000000000000000000000..a56074982ff40197d056f52badb3515b7069ec2e --- /dev/null +++ b/params_shard_266.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c480fb935e6f0c0ce12d2eb40a0efac5c75274db2588a934418eafeaca216422 +size 92274688 diff --git a/params_shard_267.bin b/params_shard_267.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a0bce3f76842e2e79bd6ec251dbefda1aeebebf --- /dev/null +++ b/params_shard_267.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc89063bb9c338a5f83ef6cc418b180ab5693e5c4fce9dd850a780660ff44f7f +size 23085056 diff --git a/params_shard_268.bin b/params_shard_268.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e90ec80813dbd8d473c0c2cbdc3419f5f6e3b8c --- /dev/null +++ b/params_shard_268.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b74d3864e06b3740e1c90c5b9693628eb49ae4f8ff9f7b17e5b3f7cf37ba9af1 +size 92274688 diff --git a/params_shard_269.bin b/params_shard_269.bin new file mode 100644 index 0000000000000000000000000000000000000000..0113c9d182df11f53fc293e79b533b936f3a43de --- /dev/null +++ b/params_shard_269.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f78854fff340fc4c44f6a9eab4523dd8aaf8b20555c5dbb8ae29b43fb4fefde +size 100663296 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..32c63f4bc239b08121142733fbe045943b54f5b1 --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4128565091d681ca965b586398c536be43896a69c7659c549a98aecfbf038f3d +size 28327936 diff --git a/params_shard_270.bin b/params_shard_270.bin new file mode 100644 index 0000000000000000000000000000000000000000..81d65667b3e9465567a3fe63ceb0062b600219f1 --- /dev/null +++ b/params_shard_270.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e9d593e33fe5352bcefb53e4a19e727e2effe8c8b46363a6ca8cb6eba06ab4 +size 23068672 diff --git a/params_shard_271.bin b/params_shard_271.bin new file mode 100644 index 0000000000000000000000000000000000000000..a74723f89733167719e9d8554b2cabad286da5fe --- /dev/null +++ b/params_shard_271.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f1a1e095d02a97bd31ecf580ba1006f5c4472e2f5f0234301febd5d4c4a11c0 +size 33554432 diff --git a/params_shard_272.bin b/params_shard_272.bin new file mode 100644 index 0000000000000000000000000000000000000000..55cf5c3b062052721334ff481b45208b08a03559 --- /dev/null +++ b/params_shard_272.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892ca02ef0e71bd52ad730c193138fc3d40a2e4fb8a4307b544d830c919ef733 +size 92274688 diff --git a/params_shard_273.bin b/params_shard_273.bin new file mode 100644 index 0000000000000000000000000000000000000000..572c9b53973d99f370abb98cd62138a1fa1fb29c --- /dev/null +++ b/params_shard_273.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:906686ca3faad523f6988c4b7a3f166c7f550d05658ead3ffc843d0f05250dbd +size 92274688 diff --git a/params_shard_274.bin b/params_shard_274.bin new file mode 100644 index 0000000000000000000000000000000000000000..886a7149d2e4edfd77a72fb7690df586736a0912 --- /dev/null +++ b/params_shard_274.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76d78cd76b26e820e2da452f6ea0f78714ca03a6eea53aeb29cc2261e119db71 +size 28327936 diff --git a/params_shard_275.bin b/params_shard_275.bin new file mode 100644 index 0000000000000000000000000000000000000000..af1fcb790727d6ea7b0c43d556b6a1e485b08294 --- /dev/null +++ b/params_shard_275.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5594a32a078a1a50647baaaad03cf28ad29d41a245993c69ccf058d2c0c01e9b +size 92274688 diff --git a/params_shard_276.bin b/params_shard_276.bin new file mode 100644 index 0000000000000000000000000000000000000000..151f52e87f5da8646c60a209713c481e767c39f1 --- /dev/null +++ b/params_shard_276.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6311336c438486a4b13b3e8e8074a82a5876e4b02735e20fd8083ef4a4675f56 +size 100663296 diff --git a/params_shard_277.bin b/params_shard_277.bin new file mode 100644 index 0000000000000000000000000000000000000000..f3ea160c34975810f7db43306a6b8d8e21aadf77 --- /dev/null +++ b/params_shard_277.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088162fe8ead24f476e4f30d87de9680662aa59cf743e3763a5dbc51b38d62ed +size 23068672 diff --git a/params_shard_278.bin b/params_shard_278.bin new file mode 100644 index 0000000000000000000000000000000000000000..7c91abfb22b146c94df11c5eb9db0a178fa057d8 --- /dev/null +++ b/params_shard_278.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27be5d641f41fdcbab4a93eda19a7744f2c4f3775623b42bc9d6e573aa4c3854 +size 33554432 diff --git a/params_shard_279.bin b/params_shard_279.bin new file mode 100644 index 0000000000000000000000000000000000000000..ca753f2cd08f13b5fabc12ea904d3019cb09bb9f --- /dev/null +++ b/params_shard_279.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75cb221c1f277ee35d15495d0d58725dbce204907e9bedb7d1e1c7a3eded88a6 +size 100663296 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ab3517f849089d226b44f2b675fd929b22e72e7 --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4c841be08567b2a90238a66d5ffa789bcad01e72cfca029956d13d1a1931c1c +size 92274688 diff --git a/params_shard_280.bin b/params_shard_280.bin new file mode 100644 index 0000000000000000000000000000000000000000..0cd406eb67fd07ffed5b26ed8880581d0454e40d --- /dev/null +++ b/params_shard_280.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a56fc08606ca4d3b213b4e33652a9d86d29c8ca6423f7ccdaaba640194e52a8 +size 33554432 diff --git a/params_shard_281.bin b/params_shard_281.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0627893ac039e6d9816e6f4c837138a9dc1c562 --- /dev/null +++ b/params_shard_281.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9f0014c95aebd1fe8cd4978754c3371c6a6bef3f853ae0bb7fd9124d47fb955 +size 29360128 diff --git a/params_shard_282.bin b/params_shard_282.bin new file mode 100644 index 0000000000000000000000000000000000000000..27f9dd7d003951b65b6f6ad35fa7210a214db8f9 --- /dev/null +++ b/params_shard_282.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f540cc10e7bbd75b8abce20188c14e99e564c8b1aff4bc6ffdb6578e141a72e +size 4194304 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab014f909f0ccc71582c21a979a63fac20a003f8 --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e523603cb1fa03fc8bbf66c74d2351173613039d0136f5faf0c49d85c0aed195 +size 100663296 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..ccf7017fe7f202f02aa0aa9a0167f7e5ac0f0d32 --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c9ab0cba4d5b9b5ad17449bbd9d1bf9a50c69c8831214c8a0e69c1b984c766 +size 33554432 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..77538a52d43618db446af9a2549e439655e8b13d --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7667681e3146093562d440ae5255bb63682fb245edc960e5f4c9628e4a32eba +size 23068672 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..81e7ec20c35f7deadbeab1cf15b539e39a85b64b --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac56c22105256fb575f1770e02d95b8cd58217317ce22e3e42a37d0cbd9905d +size 33554432 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..6cc7a926692956326df6fbc65a9d7eeaa1f1dc71 --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1e8e7f03506ac0409fdfe88ce878eb50126e9e15eb51148b50a8f1268bc6d33 +size 92274688 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..f46079dc8f54f85d7cf0a9b952de1bf754ac441d --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c68e9dd52c613bd5fd4fba09c1282545aced6e59e6a19d853132d043e03907e +size 92274688 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..40bd7ccf0f31d8aecbd59953f582470f0e266239 --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c477a746977e0dd5f55b85d815d62066b84a8b3c1e4fb00c9f676b9bd213e34d +size 28327936 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..7bb2f5de5857fda7f73ab6e212f1f7fca5a7aa01 --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd76dc57d99bcc6eb911259f0173b6960053e18f62742aa2dbf468f3966a62d6 +size 92274688 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..25086f2ee7fc29d19f09be577c29c09fa92bebaa --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16f0b4c029494425bd5291ae9aede5f6683e2753e3431b5f2c9ea933fbe3861b +size 100663296 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..a0899e966fcb34846c23357953f97db446be352f --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68ba5df126b32fcc96085c90c44af4f3d04db536661313f9fe6441e2f9c2fff4 +size 23068672 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..1e9ebe611af9f5f6468480623ae1f146e265b85c --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04bd1e4a631e0ee17a5d89840f988986a6347f48972cd65c3ad22dd061685ba +size 33554432 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..16a581af573e7cb5a8c17c34fc33c797827b2dce --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e8b80a7a0366ba1764f753f893a4d499ec37e712a3c4b84c8823b31e4145736 +size 100663296 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..83562b6f5aa5d46ccab2a134e35f52fc918f143c --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7916b9368fdf328cae9be15ca0dd98de809156cb95ebb46a14f48f906863377a +size 92274688 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..42063bb5946dc58f8612f56f7e7b529d5f20fdd3 --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cda6b52eae96853ce31bdab9e313f6408396bba2a53bd96fbf666157b6a488b8 +size 33554432 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..9b0e513082c41b656b26856b7504091389bef0d9 --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b08af975167a3f88bf2c03d9263bab266424196f62e199acf97819fd6f8a311 +size 29360128 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..98e4a05f3cea24cd7b325e0440bcb5979faff696 --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeafe067b67d8c2bad5c8fecee6558ba0780f9d5b18c622dcd419fac080c56b8 +size 92274688 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..98748576562d2d03841c46ee99956ab5c36fbda2 --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd7d820a04e303689fe7cc100330c5aed6d5f153c14c11867b0eca59e3a5fced +size 92274688 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..2d5610e46af06def26552dfe7dd6e76bcf808074 --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c80b31174d68d855457082755a83426b116550a81f5980c9491e2d0740f07f5 +size 92274688 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..0512057d14b136dfb8e772d9e3b088a315e46ed2 --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a56315745afcd38cd9655ca763979cebf770db4cc5f4d9f7cd696eda287c7cd +size 27279360 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..6732bcea3f8c8bc8e5962ccd14692a6a1cb27fee --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8074917c8dcccd339b268851095b86434b5fc8b1f7e49a6bcf5e29935615fa85 +size 92274688 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed40b340090fd690f29f8dfe7e48c3062b260901 --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20eb11381891538c347a25b62fa237287797faf9ecb156ed8cb490eeccc7c918 +size 92274688 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..b206c81bf9e8d8a58fa889d35dd5ccb7cc1e9157 --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0866f475942b1d89b80e182cd5afe3d32da9d9fbb3eb356531889c60008a8b3 +size 23085056 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..5397e4f4cd0779971a6f53d0b134fd7320cc44fa --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91d67dfa8e3efa160b0463dbbae3ce3a85e28df1e10be5c16ad29ad206a0bbc9 +size 92274688 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..c4dadf9161e53f65ce4c33b9ebfb440b427a5530 --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c520ed86028d8439768f86edffddc6113574c8e824f7e9fb39d18be0b7d0f813 +size 92274688 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..d8ca5031c6a2f2a248fe3fa9d39ca60e627341c2 --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8fb6fa951e17bf689bf212ddc0e56d2f27d3a3782b63d6a86ba27274d8d269b +size 92274688 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..6f80272b89bc1884d422c716277461aef682e985 --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1cb183fac9d67d5d29b97b8400d7d42b25ba3d8f0621800c03aaacd6c5388ca +size 23085056 diff --git a/params_shard_52.bin b/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..2af2563c81e4c0087cd0b84f02f774f2570152e9 --- /dev/null +++ b/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c4aa26577a5e7e28f1e66cad55c6349e164bfabf5968b515ba8090c59309df3 +size 92274688 diff --git a/params_shard_53.bin b/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..b6f1fa587126b09eca597035c5c1ef6b95760a5d --- /dev/null +++ b/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c788a8ca00b2ea9b530da62deff790ce9b344539e2d5b76cf3cb2625b96054a5 +size 92274688 diff --git a/params_shard_54.bin b/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..657c6c893e71cf638ba8b41eb6230fe4b0140eea --- /dev/null +++ b/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d41c147453c5aaaffaea749df6b012bc9765ab626da3b783640b8da2fba7864b +size 23068672 diff --git a/params_shard_55.bin b/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..838907df29028e9c81a3fe3db52dab308df41038 --- /dev/null +++ b/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4575d4f41af4d8df1c366d2af5433bcf658073c1c4b2de82328fd26893e09868 +size 100663296 diff --git a/params_shard_56.bin b/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..67f2d62664b9ad82f5429c5886463d78373d77cf --- /dev/null +++ b/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4135accc76a4c10b4b36b9fd597da269a11d3e1b98c2d31a472ab78c9a8054f +size 33554432 diff --git a/params_shard_57.bin b/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..314052369934f4275e6fbcfb961c0d30d3109dae --- /dev/null +++ b/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb6f0ac6199ea98786bf4a8ff230a1c5b302a9da3dfdd6f39f535dfd83a26050 +size 92274688 diff --git a/params_shard_58.bin b/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..5a11f86e5b3660ac9a9f557ffabdd460163c62a4 --- /dev/null +++ b/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43620c9c25aa4605177c45b952954802ec3346040b402d60e779813a2003f8a8 +size 28327936 diff --git a/params_shard_59.bin b/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..098862eee85a2a1725121fb288231233f5ec10d0 --- /dev/null +++ b/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c519076a8ba7e09159f03f76084b1c573c8f0c12beba86465597bc70d241fdf +size 92274688 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b8c05131d83804b537550560ccb5a32e4ad4af8 --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1522635be75515aaa7d46bab7f997fecfe49ac9af0c2b4f2ce995214aba72bb9 +size 28327936 diff --git a/params_shard_60.bin b/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..1171ec3692c65b97c145ce48eeaf8003d366d577 --- /dev/null +++ b/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f693b8506eaa9f1de1197d383d9bc3699b1291faa7ec1bf15a087b4ffc9b578e +size 92274688 diff --git a/params_shard_61.bin b/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..1e764e553a0a7de68caaa21d10118cdc1f43870a --- /dev/null +++ b/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e1fae61a0062d683a76a2819b435dff366bf187eef3a01a979ba7c126c6b9ae +size 23068672 diff --git a/params_shard_62.bin b/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..f572054dd4eac3d1d8c8b8684aaeb21fe0ea9e82 --- /dev/null +++ b/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:515497cb8bc2247ed9639afb952060f7e9a7f9be7621b3fbac83035824f43bc4 +size 100663296 diff --git a/params_shard_63.bin b/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa167f40753edbc562cbae5c0aebc9a9b254dc4d --- /dev/null +++ b/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dd6ac3ad9cb538cc07ed294c14e47889c579804f1924c3ec8e1cc5ab5a46f83 +size 33554432 diff --git a/params_shard_64.bin b/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..13c861db57e0a49e7313795d6a24d8972dd055ff --- /dev/null +++ b/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8cc290c3f5640cf0faf6b4be9f24ad14d4ff23acfa72f9b2bf48b8bbb15e8e5 +size 100663296 diff --git a/params_shard_65.bin b/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..94df4502053213ee4d143d03ef1a912ed6b502ec --- /dev/null +++ b/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974f93908e56a2051b422b11c8f4400f05f533a072a6ae4c36daf2c5eda824b7 +size 28311552 diff --git a/params_shard_66.bin b/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..2142c588fd7c305dd0aeba72e75ea75dbb24876e --- /dev/null +++ b/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac71a470c530e79bfc8803022e8d662fd4fd78a5d22f482efea6d2ede6902c95 +size 33554432 diff --git a/params_shard_67.bin b/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..583087ecf5592fb3f0ef17d8e0be81b73590f50e --- /dev/null +++ b/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a18ababe71e0d4fe5b7b86951fd7eb20aa4f5469f26292990f17fae6575a194 +size 92274688 diff --git a/params_shard_68.bin b/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..a20c11b34e37000d2a45a179e8198a6361116613 --- /dev/null +++ b/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2c85f43529eb9c1a19127288d7ffd71c8d9ca23abe3e599ae2278725d9ee22d +size 92274688 diff --git a/params_shard_69.bin b/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..373b0926f4012b4a7bf26f09f72180e2aa5dffe7 --- /dev/null +++ b/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4e6a05af2631f08949f508cdfd9a33510cc15258077457aa5ba585e2486521d +size 28327936 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..f62e5939c3ba4182d206bff5cfef20c152e5b466 --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce581fbbe9ac9d9bb60e9fc7c1c1773519fabc1193ee2fd9e6e30131475e4be1 +size 92274688 diff --git a/params_shard_70.bin b/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..196048a4f8914be2777064397b0495183586abc2 --- /dev/null +++ b/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d57920150cfea3351995566b34b816375d342fee23fe15156595f5011b7cb769 +size 92274688 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..16161aea5ad6c9d02403a85ef793dc92d5770017 --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eec9c5ba49a1299bcaab5c6c46b695c942f9adba1e3042be31ae9a2380c6bcd7 +size 92274688 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..806279c0d34d600372df9ac36d99788d5817b75f --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca8e649fd82002df9804c27f1b8153a06b8ecc7f813610218bcaa94e12bfe753 +size 23085056 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..368d598c8f87ed84fa5b0544cb4e8a1a965e193f --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5799936cc8459c67e7576d350da9c0d88fc307ef4cd50f72f27f895d8974856a +size 92274688 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..79adf3996812b684a3e31b071a01422ae8a20b6b --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d705d450868de90d80fb28e1b16401fb06068c4336caaa07ad5d544f0f7124 +size 92274688 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..bc78080341dfb06a4a469a65b2fcbdf84fabce68 --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:575bf5d89a9e416dd789338be5417754e17b7cbbc43c8b2e387c8f79dc520d28 +size 23068672 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..183938e909f191f8ea7234e49ca67af74db265cd --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fedd2d231edd599343d8e5e0068c0186947c8d68c7149c710cdf6e0b84695e1d +size 100663296 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..8acaf165cf81d24f5083624f9cee665dcbba3b26 --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:668f0aaa76ef18964449d7a80328cfd160114bd9dc7ba93ddcd87fb55a16da8b +size 33554432 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..293e5feb5f057faae468d3303c1e81fde3116f45 --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3adbe4b90d363d5298a846546da26e32053a094b95fc799df9c6eb52589c27d +size 92274688 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..347a26c748fbca00458673df3624233c597d8bf3 --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ed735471293f36abf14de45c74decae600fcfac11be8ccdd34fd7d62daaf241 +size 28327936 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..1fc686a1a2aee2f1e553948ff8177cfa75a963d2 --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:065cb88be105562cb858737d43d00c828851d629a1e36f752bf8cda7f1b822ad +size 92274688 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc667d05021161580e35238fef245afa02b8e461 --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd196f144d4193206f674f22103ecb2a58a4cb7447b347c3e701c9e1d81625f8 +size 92274688 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..8097fb702f479f418b10e8c60011149c414b132a --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402b03f3bf69de8a156ce9af3a201f343c17987097b21ebec8af5e37892b9e17 +size 92274688 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..148fbf742469f7133e92dfaab8ea24cb956af562 --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b31403b18b7d9171193be83301f270020d4a53c8af9b2b94f4d8eeea66a0833c +size 23068672 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..301b7a78eb04e4fa97b77d6842ad5d3901f064be --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08cc69897ae35ab205605a580495ffecd21082dc96c1b168d9aa463453e2ed6f +size 100663296 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..ce96ebcca8e734df10d485b8cf102a8b29f729cb --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02adf7eae7956ce3d9d1d6e96a8b2fe5332002e52da4670f9f396bff041863f +size 33554432 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..dd4cb3e4671dd5c6e51a1d7f9fabda1fc5e571a4 --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10af3fe6d7dd51b73a1d0d75ed8ccce9585438ae9fd9cb7f7042788d2c313332 +size 100663296 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..8229ae4ee12e118f7485d8c44e32fa7b2db32ad3 --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8516d52d8a3b808f90697d9da265bc301cd44e77535c0f6e3a4a637e4f98c410 +size 28311552 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..1817ac531654dc03559a71c80b4194c5d938ff6e --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b021a4de46084393a83ea294fee198f8ceb883653ffb0fef50445abdce200e5 +size 33554432 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..e794053ce42dbd3bb7d99dea9275b46e39f48682 --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30bdf266f22ae733f5e2282a5ef4deb80bab797da1879ba0a6d45e493e2b60d5 +size 92274688 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..f000721826d92ba09ac4dff0c0a38e9e65bb7466 --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd75d83701e886a05ff1825eda041dcb2a79bde4049995e11fb50827cef9ff48 +size 92274688 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..5dcfdc7fe892136f66294b2ba1acbffe9c57d7f8 --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a16dbaa7355ed98228943929629b9db8991e5b7d7766dd18818edc7ddcf763f9 +size 23085056 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..e6b543f14f6023f875d42c6c5cb8de1a3d2b4fcf --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:751f95582bd686734188238946ef4f3413d4d6ab8a3995fe5d358bd57a3889c7 +size 28327936 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..0aaa8cc541f8d691f48c8c9acfc252bc1ba26fed --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0afbd7ff476518221651a6ad8849843db1e9af68defac23232d146e10c71ce1 +size 92274688 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..92530283deee5c28257c5725a2a3f8ebe133c1af --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f99f59ecf6e4b4074d244218997926c96ebc8237b208807a2c31e132af239612 +size 92274688 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa92b02f42174e9e1477f06b84658b47a284d579 --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:052a59fc820df6e3f795588f071ca2384d670910027d96b4cfc5629b4f2fed1c +size 23085056 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..9cf743399432429da5493e32cfc4ca040423ef07 --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb90f239faff9ed1d791e8c7172d93b00f7fa067e8a3f617ac297efb9ce1146c +size 92274688 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..8ab7447f1ad00622ff745981ec12df01333a25ab --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d470aae2a2cd8abf1f12dc6e4ac4b239b45dfbc16ae0a88ba1bed077f8da24b +size 92274688 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..c79634ea3c5d4f6c64d4c646b8db2ae0f4d6c56f --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5108cdec0c53658d54c6333eafaa0c0fcbf592db689baebb0fa7543984471d94 +size 23068672 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..eebeaecd4ba371f54324fa6d90e89954a1e1117e --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:523bb3be2ec43a02a149ce35208ab1d990606d1163938ee04965330befdf7120 +size 100663296 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..dc9715333e28d90fa20ea8c267a4df0bdbcd7f58 --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c03f0cd059a26d98eeab45d81c03a1267bf4b79eec508fccb7a573bdeacdd181 +size 33554432 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..3eb704291de55554ee750e80c543a60a69116139 --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7efde370216ec9bb2883e7ff04a40b4888f7177f25db265c7699265d6eca6caf +size 92274688