diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md index 20004291aacfa6744c64d8bdf192378d39ff1d78..0567c7a137625c76594b7884bd2b5e2f06b1846b 100644 --- a/README.md +++ b/README.md @@ -1,3 +1,19 @@ --- -license: llama3.3 +license: other +license_name: eva-llama3.3 +language: +- en +- fr +- it +- pt +- hi +- es +- th +- de +base_model: EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.0 +base_model_relation: quantized +library_name: mlc-llm +pipeline_tag: text-generation --- + +4-bit [OmniQuant](https://arxiv.org/abs/2308.13137) quantized version of [EVA-LLaMA-3.33-70B-v0.0](https://huggingface.co/EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.0) for inference with the [Private LLM](https://privatellm.app/) app. diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d9e7e08f5c8e277065c653a7c72987d064f55208 --- /dev/null +++ b/config.json @@ -0,0 +1,5 @@ +{ + "quantization_config": { + "bits": 4 + } +} diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..393a55157baef20f573630d27b087968848f2327 --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,11583 @@ +{ + "metadata": { + "ParamSize": 805, + "ParamBytes": 36381212672.0, + "BitsPerParam": 3.4891900844756822 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 525336576, + "records": [ + { + "name": "lm_head.q_weight", + "shape": [ + 1024, + 128256 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 525336576, + "byteOffset": 0 + } + ], + "md5sum": "a65f7121bbf8b8d868ec27261f0ea394" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.78.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "079916373e8439416b26c803021590f2" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.78.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "4a467f55386145a23ec568e5b475acdb" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.79.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "e10f073ab500b9280d273a5591669093" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.79.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "db57537a4275e462d06b49369f058c30" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 31145984, + "records": [ + { + "name": "lm_head.q_scale", + "shape": [ + 64, + 128256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16416768, + "byteOffset": 0 + }, + { + "name": "model.layers.78.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16416768 + }, + { + "name": "model.layers.78.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 16433152 + }, + { + "name": "model.layers.78.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 20103168 + }, + { + "name": "model.layers.78.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 27443200 + }, + { + "name": "model.layers.79.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 27459584 + }, + { + "name": "model.layers.79.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27475968 + } + ], + "md5sum": "c9935a365acd087e52becaa962536a22" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.79.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "21d25ba3ebb409cf8cb942c3ca15c871" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.79.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "61864aa3de8b994bc547a7da612bc177" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 525336576, + "records": [ + { + "name": "model.embed_tokens.q_weight", + "shape": [ + 128256, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 525336576, + "byteOffset": 0 + } + ], + "md5sum": "19bb7d1345a41484942df187882e72cd" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.0.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "4385b3eec159eb8924eb4fcd346fc255" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.0.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "e3cf6990f2359e255ff30327fe225226" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 29835264, + "records": [ + { + "name": "model.layers.79.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.79.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.79.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.79.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.norm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.embed_tokens.q_scale", + "shape": [ + 128256, + 64 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16416768, + "byteOffset": 9732096 + }, + { + "name": "model.layers.0.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26148864 + }, + { + "name": "model.layers.0.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 26165248 + } + ], + "md5sum": "7caa9736dc48afa478de3ce7bcd123b6" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.0.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "7e7fa5c2a28d6189a8a3e0e44b93c7a9" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.0.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "25c50f413c669352f9fe083f99df24ff" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.1.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "9d7409d626896665cd2a7f7bd23783c8" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.1.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "6fa627de17d7d5a9265395f9e5985e57" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.1.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "e6e058383bace8c8b8a1a44266108aae" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.1.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "3551358a1946ef0074b4605d9ffa4067" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.2.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "b62d95a534623dbb7ac2c84ea7d29b23" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.2.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "10bb311d31a89b332978a6ef1c93d029" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.0.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.0.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.0.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.0.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.1.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 9715712 + }, + { + "name": "model.layers.1.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 17055744 + }, + { + "name": "model.layers.1.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 18366464 + }, + { + "name": "model.layers.1.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19415040 + }, + { + "name": "model.layers.1.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 19431424 + }, + { + "name": "model.layers.1.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.2.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.2.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "5637c60218ef6a5acbc18e5358e20c6b" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.2.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "7b1523bd56a76ccc5420b16e19f8950a" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.2.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c664d357dd39cf8309ad73799404d5e5" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.3.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d913fb3661e40e94a6b06cfc4a374a73" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.3.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "d91b06ddd90bb0c98e265b6c5d37e7ee" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.3.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "61432b6af07ce8300abcb8498a1b37f5" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.3.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "bf8571b565285c13c5738e5af9b6dd30" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.4.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "58e4bc58dbf9180d62e4ab440382e2be" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.4.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "bd29056507389a2168c12262bf8c2984" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.10.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "459c8f19196e5e0b8f90bf65f7d02035" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.10.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "424982e2737949f21173ee0027152722" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 29163520, + "records": [ + { + "name": "model.layers.2.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.2.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.2.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.2.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.3.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.3.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.3.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.3.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.3.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.3.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.4.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.4.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 24428544 + }, + { + "name": "model.layers.10.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.10.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 25493504 + } + ], + "md5sum": "f4ebc197f285a586dc473431cd70b8d7" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.10.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "fff435ef77ee67b7009decfbd85ed635" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.10.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c87689882aebbe8ee0e82ef873f30f53" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.11.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "eda41186789b7b630bc766a8fcf3ed92" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.11.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "ab6f74ce49f74d77635fb2085b9f36ca" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.11.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "31df8d1d2c72b02ccf970a06e3cf06b2" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.11.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "e5f1146267aca13b2413ce248382e211" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.12.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "19839cd95d91874923b6e3668c64efd6" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.12.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "b3727af0bab99a27b512a132d063a363" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.12.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a1cb61616690137c47788b6f0b5ab0f4" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.9.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "a0e04a7c7e61809bcecd6bb237524f30" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 32833536, + "records": [ + { + "name": "model.layers.10.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.10.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.10.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.10.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.11.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.11.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.11.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.11.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.11.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.11.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.12.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 23117824 + }, + { + "name": "model.layers.12.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 30457856 + }, + { + "name": "model.layers.12.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 31768576 + }, + { + "name": "model.layers.9.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 32817152 + } + ], + "md5sum": "7a0f439ee39dfb0834f96a3d7656fdab" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.12.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "9c22c9791b36f7d7130ee135c44c13ed" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.13.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "2f795ab7dffa6d6aec6d8ecea4c08f80" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.13.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "d688d4bb7774d53ebf3c7df759415d77" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.13.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "895ec78beaf86813dec6271a9fe7d8d3" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.13.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "7e026a2f5470b98e1ee0863ac7169019" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.14.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "897ab178a94d32fc5b411601720fae85" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.14.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "a07b062e6b12cfe5aeda52e7d132b1b9" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 28147712, + "records": [ + { + "name": "model.layers.9.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.9.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.12.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7356416 + }, + { + "name": "model.layers.12.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 7372800 + }, + { + "name": "model.layers.12.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11042816 + }, + { + "name": "model.layers.13.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11059200 + }, + { + "name": "model.layers.13.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 11075584 + }, + { + "name": "model.layers.13.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 14745600 + }, + { + "name": "model.layers.13.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22085632 + }, + { + "name": "model.layers.13.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 22102016 + }, + { + "name": "model.layers.13.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 23412736 + }, + { + "name": "model.layers.14.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24461312 + }, + { + "name": "model.layers.14.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 24477696 + } + ], + "md5sum": "486586a5ed545b44cfbfff0196f94446" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.14.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "ccc6b5a6d61a7d38f13c5c50720ec74b" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.14.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "6f2ea4b46f95a964ce85f62c8841f077" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.15.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "874424c7a11be564544f023d0fc5e66d" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.15.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "4bcd9d986b55e73164fefb81fd85ce9d" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.15.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "1ee68df07b01513df401b7bd27a4d53f" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.15.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "238fd10527f39aefbd96cf9aeec84c19" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.16.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "10bc6b383a0ef458a002a74a4a0d8533" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.16.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "233cfe1b2f6251009f2e5c376ae49b18" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.14.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.14.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.14.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.14.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.15.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 9715712 + }, + { + "name": "model.layers.15.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 11026432 + }, + { + "name": "model.layers.15.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 12075008 + }, + { + "name": "model.layers.15.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 12091392 + }, + { + "name": "model.layers.15.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 15761408 + }, + { + "name": "model.layers.15.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.16.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.16.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "1cbb7992d099992979eb45229a094d66" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.16.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "e76744d8869155d7ba396cef7b4e469d" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.16.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "59fc2957d0b7b8ef918b73d35808869f" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.17.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "b5252a71aadd6a5d65cfe3e1af2ad3ea" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.17.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "decb1f74d6b7780c1bf5f58d3dc925af" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.17.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "a10a2e835e64746cee643df5514bf13f" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.17.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "62a1fb1d9d15e07aeaa05864f6c1979e" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.18.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "5d75c4a3b2c7245ac2e8b10df5b33931" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.18.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "90b32b90695635b8bce07d60a95e211d" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.18.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "51ae7ded98490d7d1390fdf24b29d07f" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 28114944, + "records": [ + { + "name": "model.layers.16.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.16.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.16.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.16.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.17.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.17.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.17.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.17.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.17.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.17.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.18.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.18.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24428544 + }, + { + "name": "model.layers.18.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 24444928 + } + ], + "md5sum": "8b2bd2b086ecfc0dc6e343434401df67" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.18.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "52209f9eae10e50058598c9738f795c0" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.19.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "46ad35ec9b89b0726a302c10aa41ddd2" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.19.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "6a8457909af459f3867a4cafdfbd0478" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.19.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "90d3c31af2efd5b3e5dfb092243b8229" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.19.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "5beb0a8f9d793af02a87c36bf63b68e2" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.20.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c19a628173d75a4548db8bb78a49e49b" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.20.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "7e59e393075f24b698641489fefaca68" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.20.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "70dd0d58570e814802621fdf41c80516" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 32817152, + "records": [ + { + "name": "model.layers.18.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.18.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.18.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 7356416 + }, + { + "name": "model.layers.19.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 8404992 + }, + { + "name": "model.layers.19.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 8421376 + }, + { + "name": "model.layers.19.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 12091392 + }, + { + "name": "model.layers.19.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19431424 + }, + { + "name": "model.layers.19.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 19447808 + }, + { + "name": "model.layers.19.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 20758528 + }, + { + "name": "model.layers.20.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 21807104 + }, + { + "name": "model.layers.20.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 25477120 + } + ], + "md5sum": "0028ee1956ddf06c33f4cf64ddc2f029" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.20.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "da9272f8f2e80c28c9de0866664b8f45" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.21.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "46884fb006fe62957bf54f1d444080b7" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.21.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "424a3ab4029bdebd40fe6c3112fde6f2" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.21.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "44354e9c7d871b1191f963b428f56474" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.21.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "5395e460fece233d880f229d4f6b65ca" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.22.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "83ea770c5566f7815f9a0b532df4b752" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.22.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "cbfac70d672977e68bec1a9b19c3f34d" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.22.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "07243a39d5d6c7bca3c415aaa201b996" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.22.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "3187524e781e1cf85278fcb4853391fe" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.23.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "68ff0bf5940cf94b90ffd0e1082bf50b" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 29196288, + "records": [ + { + "name": "model.layers.20.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 0 + }, + { + "name": "model.layers.20.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 1310720 + }, + { + "name": "model.layers.20.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.20.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2375680 + }, + { + "name": "model.layers.21.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2392064 + }, + { + "name": "model.layers.21.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2408448 + }, + { + "name": "model.layers.21.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6078464 + }, + { + "name": "model.layers.21.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13418496 + }, + { + "name": "model.layers.21.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 13434880 + }, + { + "name": "model.layers.21.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 14745600 + }, + { + "name": "model.layers.22.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15794176 + }, + { + "name": "model.layers.22.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 15810560 + }, + { + "name": "model.layers.22.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 19480576 + }, + { + "name": "model.layers.22.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26820608 + }, + { + "name": "model.layers.22.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 26836992 + }, + { + "name": "model.layers.22.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 28147712 + } + ], + "md5sum": "b0464fe0f2c5ae8c1c6cef05225c7af7" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.23.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "b285268e3e170f8e0672507132d5e5eb" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.23.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "6bee485fe1eeeba530fa091041765705" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.23.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c7a7b4aa23817b52eb19079f6e209095" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.24.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "63ea476fec6dc52eaa59085b21fbac4d" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.24.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "16484046269996c75abe52dfa77c217b" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.24.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "a333f3f806ec5397a8e86c20f365f300" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.24.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "76b83ea0013c6d397c6593daccbe2b93" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.25.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "555749486d47169aa63132849b28d4d9" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.25.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "efe4a491fdc5ed71271e290639d004eb" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 30490624, + "records": [ + { + "name": "model.layers.23.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.23.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.23.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.23.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.23.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9715712 + }, + { + "name": "model.layers.23.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.24.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13402112 + }, + { + "name": "model.layers.24.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 13418496 + }, + { + "name": "model.layers.24.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 17088512 + }, + { + "name": "model.layers.24.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24428544 + }, + { + "name": "model.layers.24.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 24444928 + }, + { + "name": "model.layers.24.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 25755648 + }, + { + "name": "model.layers.25.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26804224 + }, + { + "name": "model.layers.25.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 26820608 + } + ], + "md5sum": "0c997f609fd44e7770fd124771421496" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.25.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "4663d733b6b863472eab8554b83174f2" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.25.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "16da0a07eb9ff4e11e2e8b42fdf551f5" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.26.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "93fb9871c9669e2c72bbf4e5e8879c78" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.26.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "d28e1f3403430b913452ec32f7f4537e" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.26.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "afc08b0725f1157fb1d53487272ae7a4" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.26.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "15431e1cbaac5ba16c842159477a2f32" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.27.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ce72745c774e7c094664024f99227824" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.27.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "974a5045bd59d69c670454f235f46640" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.25.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.25.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.25.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.25.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.26.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 9715712 + }, + { + "name": "model.layers.26.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 11026432 + }, + { + "name": "model.layers.26.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 12075008 + }, + { + "name": "model.layers.26.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 12091392 + }, + { + "name": "model.layers.26.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 15761408 + }, + { + "name": "model.layers.26.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.27.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.27.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "59f872a77ee3b7e45c42b4c323302919" + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.27.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "8d9970ea5695a126d1536dba6a7f5ec9" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.27.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "39eafea562df2a5ceb7fcf21897896c7" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.28.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "77a32e698f40d5472005e089f893ef81" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.28.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "791c1e45b9e2d657db1faaac6b887083" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.28.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "1532db18778b67e5c5e7676a9c737c55" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.28.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "00927663ebfcf61af2907e59362ae58e" + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.29.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "185afd3fb699c021e291099c0a38d7f7" + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.29.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "2969c1423647885127380f9ddddedacb" + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.29.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "12f2c88470f85706847dbf687fe7e7c2" + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 28114944, + "records": [ + { + "name": "model.layers.27.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.27.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.27.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.27.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.28.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.28.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.28.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.28.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.28.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.28.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.29.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.29.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24428544 + }, + { + "name": "model.layers.29.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 24444928 + } + ], + "md5sum": "e64ca288ab0a2d77627406946cc8054d" + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.29.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "bb597add15cda85714890bd803712cd2" + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.30.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c62b97b056f2a2b8c01319957c82190c" + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.30.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "bd0aab9daac986182e8c6a1d573aeaba" + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.30.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "5c47dd63fc952ef3b20433de0532c46d" + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.30.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "34d21e3f2fa57455c81ea8bd0c951cba" + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.31.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "e0638ba0a1b31900a754f8b4756b16d8" + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.31.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "c23d4db5fec8c8262dea715768d429d0" + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.31.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "bfd6f7c110d7f638c06ccdbfd404292d" + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 32817152, + "records": [ + { + "name": "model.layers.29.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.29.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.29.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 7356416 + }, + { + "name": "model.layers.30.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 8404992 + }, + { + "name": "model.layers.30.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 8421376 + }, + { + "name": "model.layers.30.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 12091392 + }, + { + "name": "model.layers.30.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19431424 + }, + { + "name": "model.layers.30.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 19447808 + }, + { + "name": "model.layers.30.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 20758528 + }, + { + "name": "model.layers.31.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 21807104 + }, + { + "name": "model.layers.31.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 25477120 + } + ], + "md5sum": "7fc9a6fcbc061712387aea0d8d79bfb6" + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.31.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "3377c652b7947a8779fcb825a124d6dd" + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.32.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "0e562d9fe7a780f238f1963ffb3aef2e" + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.32.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "a93fd0e453b3858877672089ec190d70" + }, + { + "dataPath": "params_shard_131.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.32.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "cb56021bd2ebbf01533229cf7da71dda" + }, + { + "dataPath": "params_shard_132.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.32.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "295017ccd030c6465e6f9f4148b863f5" + }, + { + "dataPath": "params_shard_133.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.33.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "e5858146aa76940994b5ff9fdb0229a4" + }, + { + "dataPath": "params_shard_134.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.33.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "45d3349c4f19f5315f2795f4f1777d30" + }, + { + "dataPath": "params_shard_135.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.33.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "86f5729b4febad86d0c5a3102a7228e3" + }, + { + "dataPath": "params_shard_136.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.33.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "f2471243f3c41b4d037f22f21c29018c" + }, + { + "dataPath": "params_shard_137.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.34.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "bb4c0980fd073d3cd82b72859a5d2003" + }, + { + "dataPath": "params_shard_138.bin", + "format": "raw-shard", + "nbytes": 29196288, + "records": [ + { + "name": "model.layers.31.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 0 + }, + { + "name": "model.layers.31.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 1310720 + }, + { + "name": "model.layers.31.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.31.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2375680 + }, + { + "name": "model.layers.32.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2392064 + }, + { + "name": "model.layers.32.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2408448 + }, + { + "name": "model.layers.32.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6078464 + }, + { + "name": "model.layers.32.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13418496 + }, + { + "name": "model.layers.32.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 13434880 + }, + { + "name": "model.layers.32.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 14745600 + }, + { + "name": "model.layers.33.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15794176 + }, + { + "name": "model.layers.33.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 15810560 + }, + { + "name": "model.layers.33.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 19480576 + }, + { + "name": "model.layers.33.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26820608 + }, + { + "name": "model.layers.33.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 26836992 + }, + { + "name": "model.layers.33.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 28147712 + } + ], + "md5sum": "1c8a135f82d939e3710435acde44cd5e" + }, + { + "dataPath": "params_shard_139.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.34.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "2464186b085595e1823554f265d3029d" + }, + { + "dataPath": "params_shard_140.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.34.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0e69f17fcb15ca19095227d19febcdbf" + }, + { + "dataPath": "params_shard_141.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.34.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "18462f370054075105ed9f9c856b4d17" + }, + { + "dataPath": "params_shard_142.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.35.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "bbf2604c6486780edf6d85ef1013067f" + }, + { + "dataPath": "params_shard_143.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.35.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "c6919f02cf8e6389b99d646422060b56" + }, + { + "dataPath": "params_shard_144.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.35.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "7134a0b5da2f31685532ae6e8905c8d8" + }, + { + "dataPath": "params_shard_145.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.35.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "050cc916aab9db40f95c239811c28428" + }, + { + "dataPath": "params_shard_146.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.36.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "7ebe268884c952c68a044b433e646ddb" + }, + { + "dataPath": "params_shard_147.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.36.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "2782897d6a93c1f8f577653a0f58de5d" + }, + { + "dataPath": "params_shard_148.bin", + "format": "raw-shard", + "nbytes": 30490624, + "records": [ + { + "name": "model.layers.34.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.34.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.34.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.34.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.34.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9715712 + }, + { + "name": "model.layers.34.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.35.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13402112 + }, + { + "name": "model.layers.35.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 13418496 + }, + { + "name": "model.layers.35.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 17088512 + }, + { + "name": "model.layers.35.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24428544 + }, + { + "name": "model.layers.35.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 24444928 + }, + { + "name": "model.layers.35.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 25755648 + }, + { + "name": "model.layers.36.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26804224 + }, + { + "name": "model.layers.36.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 26820608 + } + ], + "md5sum": "23ef91b2760197134016331f3127b176" + }, + { + "dataPath": "params_shard_149.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.36.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "bcea0aa1d5114a8cc9e0f5a8f01c0f0c" + }, + { + "dataPath": "params_shard_150.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.36.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "2872e98c9340973c5b7f48173eecc27e" + }, + { + "dataPath": "params_shard_151.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.37.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "89e7a172f180ad17486ba1ef0f32661f" + }, + { + "dataPath": "params_shard_152.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.37.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "aa7b18257721bc2d12878d6be6e506bd" + }, + { + "dataPath": "params_shard_153.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.37.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c8dc27111621bd20f6ee4f7a82a4a3f3" + }, + { + "dataPath": "params_shard_154.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.37.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "81acabf88fc63dcce5cfd079d6070cd9" + }, + { + "dataPath": "params_shard_155.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.38.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "f995db5e4b30f36c4239a105ba64868d" + }, + { + "dataPath": "params_shard_156.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.38.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "5a2f411dc7c53b49690f663f8dfe5faa" + }, + { + "dataPath": "params_shard_157.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.36.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.36.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.36.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.36.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.37.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 9715712 + }, + { + "name": "model.layers.37.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 11026432 + }, + { + "name": "model.layers.37.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 12075008 + }, + { + "name": "model.layers.37.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 12091392 + }, + { + "name": "model.layers.37.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 15761408 + }, + { + "name": "model.layers.37.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.38.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.38.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "c45bdd15806391a392a758bd1f23020c" + }, + { + "dataPath": "params_shard_158.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.38.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "c826963d22d1a25a3e75d4c68d1e8586" + }, + { + "dataPath": "params_shard_159.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.38.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "f9bf34fa6c07391207497fa2460417bd" + }, + { + "dataPath": "params_shard_160.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.39.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "75beae32aa3e622b728208f997c859de" + }, + { + "dataPath": "params_shard_161.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.39.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "234c4b659daee5c288fcb6a72ccf0de4" + }, + { + "dataPath": "params_shard_162.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.39.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "3cac40cbdaf1b2929d8f6d2e5ed0f91f" + }, + { + "dataPath": "params_shard_163.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.39.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c3b077c535f7feeb323902d66837d739" + }, + { + "dataPath": "params_shard_164.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.40.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "838fc9831170876bc3065d17dd8daa19" + }, + { + "dataPath": "params_shard_165.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.4.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c192e7944f8cbb13f0fb125542311b77" + }, + { + "dataPath": "params_shard_166.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.4.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "25e728112dde9b61ba13c428cbee8c0a" + }, + { + "dataPath": "params_shard_167.bin", + "format": "raw-shard", + "nbytes": 28114944, + "records": [ + { + "name": "model.layers.38.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.38.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.38.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.38.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.39.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.39.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.39.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.39.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.39.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.39.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.40.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.4.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24428544 + }, + { + "name": "model.layers.4.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 24444928 + } + ], + "md5sum": "ef3756c61d09940b77e620e3c27bfd6a" + }, + { + "dataPath": "params_shard_168.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.5.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c6dd71e5db5f49925206ff3c4ab34ba3" + }, + { + "dataPath": "params_shard_169.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.5.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "bc1cd9af077e53b2bf4131e61b622349" + }, + { + "dataPath": "params_shard_170.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.5.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "e8b54f5e29eff139cd679e56b9754c59" + }, + { + "dataPath": "params_shard_171.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.5.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c0353c4a35c5f09cdf546a8fb9868fb6" + }, + { + "dataPath": "params_shard_172.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.6.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "9d6949dea0f5a27567046f9542d593a3" + }, + { + "dataPath": "params_shard_173.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.6.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "1b86008f60aebde99e19a040a4e16c34" + }, + { + "dataPath": "params_shard_174.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.6.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "8aa2af8430cd7b521d4ad88c0ed678f2" + }, + { + "dataPath": "params_shard_175.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.6.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c424528dad1d732f494782338617f63d" + }, + { + "dataPath": "params_shard_176.bin", + "format": "raw-shard", + "nbytes": 33112064, + "records": [ + { + "name": "model.layers.4.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.4.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.5.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7356416 + }, + { + "name": "model.layers.5.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 7372800 + }, + { + "name": "model.layers.5.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 11042816 + }, + { + "name": "model.layers.5.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 18382848 + }, + { + "name": "model.layers.5.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 18399232 + }, + { + "name": "model.layers.5.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 19709952 + }, + { + "name": "model.layers.6.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.6.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 20774912 + }, + { + "name": "model.layers.6.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 24444928 + }, + { + "name": "model.layers.6.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31784960 + }, + { + "name": "model.layers.6.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 31801344 + } + ], + "md5sum": "524b28b24bebd810febd852f250df9b5" + }, + { + "dataPath": "params_shard_177.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.7.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "a6dd04f69e197a89446c67f850feb5d1" + }, + { + "dataPath": "params_shard_178.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.40.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "007bc0099bcb00d042632ad6b6f26574" + }, + { + "dataPath": "params_shard_179.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.40.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "21ac5ffcb4da5bbf89fe7c2346ae7a2f" + }, + { + "dataPath": "params_shard_180.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.40.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "9395c2f45f506c8ab0960eaa3ad5a206" + }, + { + "dataPath": "params_shard_181.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.41.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "3c31460f949db2db5332e84c6833325c" + }, + { + "dataPath": "params_shard_182.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.41.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "42e8d0a25e8186d76c3d23644854fa44" + }, + { + "dataPath": "params_shard_183.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.41.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "1f665af0a917d13af70d3bf8df0de2cc" + }, + { + "dataPath": "params_shard_184.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.41.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0a99049d8e4c939a3a9b76e9cb910d7f" + }, + { + "dataPath": "params_shard_185.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.42.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "3fa33fc63a4528b7a3d122bd3d986c07" + }, + { + "dataPath": "params_shard_186.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.42.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "fcd51b0e34176263a3fe66cc6100a7c2" + }, + { + "dataPath": "params_shard_187.bin", + "format": "raw-shard", + "nbytes": 31522816, + "records": [ + { + "name": "model.layers.6.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "model.layers.7.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 1048576 + }, + { + "name": "model.layers.40.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.40.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2375680 + }, + { + "name": "model.layers.40.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6045696 + }, + { + "name": "model.layers.40.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.40.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 13402112 + }, + { + "name": "model.layers.41.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 14450688 + }, + { + "name": "model.layers.41.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 14467072 + }, + { + "name": "model.layers.41.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 18137088 + }, + { + "name": "model.layers.41.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.41.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 25493504 + }, + { + "name": "model.layers.41.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 26804224 + }, + { + "name": "model.layers.42.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27852800 + } + ], + "md5sum": "0aced6ec132e5a579419ae33390f6090" + }, + { + "dataPath": "params_shard_188.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.42.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "c5bcf4c1a716c488c9f02ad680686639" + }, + { + "dataPath": "params_shard_189.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.42.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "ecebde62a42541dcf4fc5faf04ff55d3" + }, + { + "dataPath": "params_shard_190.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.43.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "0ddf0f740ef9c6f8df6564d77c2ab402" + }, + { + "dataPath": "params_shard_191.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.43.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "932b85f0c1eb7e604db6d6b3e40eeff6" + }, + { + "dataPath": "params_shard_192.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.43.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "df4f51e223d3fbcd722d674b17b85b72" + }, + { + "dataPath": "params_shard_193.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.43.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "4e17ee1aae920da61040de20c942e809" + }, + { + "dataPath": "params_shard_194.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.44.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "b6e94af2ee42fd9790798cd0ddfdf85f" + }, + { + "dataPath": "params_shard_195.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.44.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "33db141ebeac57146df0af670aef18a6" + }, + { + "dataPath": "params_shard_196.bin", + "format": "raw-shard", + "nbytes": 26820608, + "records": [ + { + "name": "model.layers.42.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.42.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.42.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.42.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.42.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.43.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9732096 + }, + { + "name": "model.layers.43.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9748480 + }, + { + "name": "model.layers.43.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13418496 + }, + { + "name": "model.layers.43.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.43.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20774912 + }, + { + "name": "model.layers.43.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22085632 + }, + { + "name": "model.layers.44.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23134208 + }, + { + "name": "model.layers.44.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23150592 + } + ], + "md5sum": "2bc6d0ea37ca9bbb3c227dd670511409" + }, + { + "dataPath": "params_shard_197.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.44.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "32ca45f8f98bcf29a6ef5da084a2b3e1" + }, + { + "dataPath": "params_shard_198.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.44.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "e6a6601776abbd14b09a133ef5dd569c" + }, + { + "dataPath": "params_shard_199.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.45.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "72d3d57b65fa4cd2a277167bf9bf6829" + }, + { + "dataPath": "params_shard_200.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.45.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "b0bb6195e7884950a91d9925e20aeb0b" + }, + { + "dataPath": "params_shard_201.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.45.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "6cc4807eed1349104fd28160fad7e631" + }, + { + "dataPath": "params_shard_202.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.45.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "6d4abed9881234788150b5edc5b1cbbc" + }, + { + "dataPath": "params_shard_203.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.46.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "3a9fcf6332786f36e7cc54c1c8f02cb2" + }, + { + "dataPath": "params_shard_204.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.46.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "e20d5c9975b750c415dabc80e7957401" + }, + { + "dataPath": "params_shard_205.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.44.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.44.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.44.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.44.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.45.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 9715712 + }, + { + "name": "model.layers.45.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 17055744 + }, + { + "name": "model.layers.45.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 18366464 + }, + { + "name": "model.layers.45.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19415040 + }, + { + "name": "model.layers.45.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 19431424 + }, + { + "name": "model.layers.45.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.46.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.46.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "ce4bd8fecedadaf835ba3fee134ec186" + }, + { + "dataPath": "params_shard_206.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.46.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "433ab37263ece443ee3c28f1a95a623e" + }, + { + "dataPath": "params_shard_207.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.46.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "ed26d6c68fb958bd9ae4cecb7a58f83c" + }, + { + "dataPath": "params_shard_208.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.47.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "936638a30e6702e2793138f624629c27" + }, + { + "dataPath": "params_shard_209.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.47.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "c000057abc4ffad2dbbb48bd4f197fe9" + }, + { + "dataPath": "params_shard_210.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.47.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "56648df5027134d9084144b5880669a9" + }, + { + "dataPath": "params_shard_211.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.47.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "51d5762944d32e4d1487c48eee4f1d17" + }, + { + "dataPath": "params_shard_212.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.48.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "8f10f8bedbedbfcdcd72c8a07b0854bc" + }, + { + "dataPath": "params_shard_213.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.48.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "6db733fcab6507bda496c3100274d280" + }, + { + "dataPath": "params_shard_214.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.48.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "1bf7ad7387ba1e3c233ec7b77cc9063b" + }, + { + "dataPath": "params_shard_215.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.48.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "f10e732250d045c0a89c7400bf81ba5e" + }, + { + "dataPath": "params_shard_216.bin", + "format": "raw-shard", + "nbytes": 29163520, + "records": [ + { + "name": "model.layers.46.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.46.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.46.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.46.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.47.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.47.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.47.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.47.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.47.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.47.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.48.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.48.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 24428544 + }, + { + "name": "model.layers.48.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.48.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 25493504 + } + ], + "md5sum": "e142d92f388a664851dc507d6c76aefc" + }, + { + "dataPath": "params_shard_217.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.49.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "29bae3b62083c39b78c1ae447438ed6b" + }, + { + "dataPath": "params_shard_218.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.49.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "71cf4e1d3c705e24a610f0ad5f29d2dd" + }, + { + "dataPath": "params_shard_219.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.49.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "790b0b646a0a79a234f97bf91faee87d" + }, + { + "dataPath": "params_shard_220.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.49.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "7dfd52df71947ebb319f2d4073df34d9" + }, + { + "dataPath": "params_shard_221.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.50.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "98eb45f227f35655f4cfbf7bd5011ba6" + }, + { + "dataPath": "params_shard_222.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.50.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "1c8b4e7cc8cb93be0e5ec65431de17fe" + }, + { + "dataPath": "params_shard_223.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.50.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "d1ab90b450c3d87b05cd1f778e751e58" + }, + { + "dataPath": "params_shard_224.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.50.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a691e0de61a67925761ddbda160067a9" + }, + { + "dataPath": "params_shard_225.bin", + "format": "raw-shard", + "nbytes": 33112064, + "records": [ + { + "name": "model.layers.48.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.48.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.49.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7356416 + }, + { + "name": "model.layers.49.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 7372800 + }, + { + "name": "model.layers.49.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 11042816 + }, + { + "name": "model.layers.49.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 18382848 + }, + { + "name": "model.layers.49.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 18399232 + }, + { + "name": "model.layers.49.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 19709952 + }, + { + "name": "model.layers.50.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.50.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 20774912 + }, + { + "name": "model.layers.50.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 24444928 + }, + { + "name": "model.layers.50.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31784960 + }, + { + "name": "model.layers.50.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 31801344 + } + ], + "md5sum": "65c4acfb580882ab2896e6692d62c39c" + }, + { + "dataPath": "params_shard_226.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.51.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "6e9434cdd79e4e0cfe6c101f135187ab" + }, + { + "dataPath": "params_shard_227.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.51.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ea6abded8d1b7d2acd268650f7dd4489" + }, + { + "dataPath": "params_shard_228.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.51.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "bd71205d5177b0866e387afa10db7816" + }, + { + "dataPath": "params_shard_229.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.51.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "dc6ed92ee858776ebf72fdd72aee82dd" + }, + { + "dataPath": "params_shard_230.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.52.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "cd98b15d42e4a5a8f6f229787a5fddb5" + }, + { + "dataPath": "params_shard_231.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.52.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "d41202bb9b3d09f6676b79cc2b6e57fe" + }, + { + "dataPath": "params_shard_232.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.52.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "b8ad45e2ac9716818a10e8b8a4c6f832" + }, + { + "dataPath": "params_shard_233.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.52.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "339dc6d977c497afebf968616d3d674c" + }, + { + "dataPath": "params_shard_234.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.53.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "84f2de941e6fdd7088fed2743f392e3f" + }, + { + "dataPath": "params_shard_235.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.53.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "1915b8879ca438c549cc6689093802bc" + }, + { + "dataPath": "params_shard_236.bin", + "format": "raw-shard", + "nbytes": 31522816, + "records": [ + { + "name": "model.layers.50.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "model.layers.51.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 1048576 + }, + { + "name": "model.layers.51.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.51.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2375680 + }, + { + "name": "model.layers.51.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6045696 + }, + { + "name": "model.layers.51.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.51.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 13402112 + }, + { + "name": "model.layers.52.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 14450688 + }, + { + "name": "model.layers.52.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 14467072 + }, + { + "name": "model.layers.52.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 18137088 + }, + { + "name": "model.layers.52.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.52.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 25493504 + }, + { + "name": "model.layers.52.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 26804224 + }, + { + "name": "model.layers.53.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27852800 + } + ], + "md5sum": "4931483cdb2adbe14da2f5c34657b214" + }, + { + "dataPath": "params_shard_237.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.53.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "38cf9b231d89e347544de8747ffc37ea" + }, + { + "dataPath": "params_shard_238.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.53.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c8f78c17c0c479e1c87598aa92cdb1b9" + }, + { + "dataPath": "params_shard_239.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.54.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "924aa14eef39925da99f3bf8cd838955" + }, + { + "dataPath": "params_shard_240.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.54.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "0184a2a95b26a1cb956f915c8cfd7fe8" + }, + { + "dataPath": "params_shard_241.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.54.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "591e2781d81e0dfec20bc2e123524cd3" + }, + { + "dataPath": "params_shard_242.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.54.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "2db7c99e5245c420f5c4f3d0a6439552" + }, + { + "dataPath": "params_shard_243.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.55.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "26f8ccb72e1ace2d442ad1d622cd3417" + }, + { + "dataPath": "params_shard_244.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.55.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "ed7eaa4bd8b058e684035bfb36f26f12" + }, + { + "dataPath": "params_shard_245.bin", + "format": "raw-shard", + "nbytes": 26820608, + "records": [ + { + "name": "model.layers.53.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.53.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.53.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.53.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.53.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.54.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9732096 + }, + { + "name": "model.layers.54.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9748480 + }, + { + "name": "model.layers.54.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13418496 + }, + { + "name": "model.layers.54.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.54.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20774912 + }, + { + "name": "model.layers.54.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22085632 + }, + { + "name": "model.layers.55.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23134208 + }, + { + "name": "model.layers.55.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23150592 + } + ], + "md5sum": "e0a9fd76b3f017559938996902c2b0b3" + }, + { + "dataPath": "params_shard_246.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.55.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "ce4ca479d943d06e729c1572996877bf" + }, + { + "dataPath": "params_shard_247.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.55.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "5bca160fc0db7f86286e2498424b4ecf" + }, + { + "dataPath": "params_shard_248.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.56.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "63fc0505ac44d485d77462ff7d00fdd3" + }, + { + "dataPath": "params_shard_249.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.56.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "fb581f9ad7e15603e91aba3c78571aab" + }, + { + "dataPath": "params_shard_250.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.56.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "29e801813798f75d407a6315b6f01d96" + }, + { + "dataPath": "params_shard_251.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.56.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "9aaf7dad94faba4f3d356d6daea7519f" + }, + { + "dataPath": "params_shard_252.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.57.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "206a81dd9e934130303eb22c484cd245" + }, + { + "dataPath": "params_shard_253.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.57.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "32aef920f1c4a3ccdc13e13c5d503f19" + }, + { + "dataPath": "params_shard_254.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.55.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.55.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.55.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.55.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.56.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 9715712 + }, + { + "name": "model.layers.56.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 17055744 + }, + { + "name": "model.layers.56.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 18366464 + }, + { + "name": "model.layers.56.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19415040 + }, + { + "name": "model.layers.56.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 19431424 + }, + { + "name": "model.layers.56.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.57.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.57.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "8d7c600d10d19c5b0fb9e53be77c6b8e" + }, + { + "dataPath": "params_shard_255.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.57.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "c4cfe5926ed035733948ab4926604bca" + }, + { + "dataPath": "params_shard_256.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.57.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "f0669876921c273c771bf838b3f9dfe4" + }, + { + "dataPath": "params_shard_257.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.58.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "86b01e5281b807b4bec63e95dede1c3f" + }, + { + "dataPath": "params_shard_258.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.58.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "ff3418763e83d7cb8d8bffee086c8711" + }, + { + "dataPath": "params_shard_259.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.58.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "9a1674d242d71caffda35d4044e2e6d4" + }, + { + "dataPath": "params_shard_260.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.58.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a087457f274ce3efa70a6b082f95db0f" + }, + { + "dataPath": "params_shard_261.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.59.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "3e947d986d7f68b02026a813966d6a75" + }, + { + "dataPath": "params_shard_262.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.59.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "2ba2a7dbc00e86e3a510d2041f6deb45" + }, + { + "dataPath": "params_shard_263.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.59.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "2bcdee34cee1ec2ff10a5b46ddc7e68f" + }, + { + "dataPath": "params_shard_264.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.59.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "1f3e09f5b7c5e63209dcbf9f39be1ac7" + }, + { + "dataPath": "params_shard_265.bin", + "format": "raw-shard", + "nbytes": 29163520, + "records": [ + { + "name": "model.layers.57.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.57.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.57.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.57.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.58.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.58.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.58.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.58.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.58.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.58.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.59.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.59.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 24428544 + }, + { + "name": "model.layers.59.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.59.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 25493504 + } + ], + "md5sum": "fb959746a3bf5517c9f2655d57a16a1b" + }, + { + "dataPath": "params_shard_266.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.60.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "27ea1a7501b47563757cd96c7460ef39" + }, + { + "dataPath": "params_shard_267.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.60.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "d526356a1e2650460ba0db853b6fcffc" + }, + { + "dataPath": "params_shard_268.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.60.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "497d49d7251862c72c14ce1b2297fcfe" + }, + { + "dataPath": "params_shard_269.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.60.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "2abf0a56395284422367ab7fc159fdd0" + }, + { + "dataPath": "params_shard_270.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.61.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "6c2be5cd8e48a5fc5d192ddc63ddc665" + }, + { + "dataPath": "params_shard_271.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.61.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "75390dce32f019f66a1f832ba7a50c0e" + }, + { + "dataPath": "params_shard_272.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.61.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "3c10070dd5cfd06c28c6aadbd4f30f3d" + }, + { + "dataPath": "params_shard_273.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.61.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "90c15c3bcd5e58f38dcf17c3a6e436b2" + }, + { + "dataPath": "params_shard_274.bin", + "format": "raw-shard", + "nbytes": 33112064, + "records": [ + { + "name": "model.layers.59.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.59.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.60.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7356416 + }, + { + "name": "model.layers.60.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 7372800 + }, + { + "name": "model.layers.60.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 11042816 + }, + { + "name": "model.layers.60.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 18382848 + }, + { + "name": "model.layers.60.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 18399232 + }, + { + "name": "model.layers.60.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 19709952 + }, + { + "name": "model.layers.61.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.61.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 20774912 + }, + { + "name": "model.layers.61.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 24444928 + }, + { + "name": "model.layers.61.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31784960 + }, + { + "name": "model.layers.61.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 31801344 + } + ], + "md5sum": "ab54ccaa04e79a0fa3148d2278de5e91" + }, + { + "dataPath": "params_shard_275.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.62.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "dcb2755fd9c420f63ec3b104b47a0c15" + }, + { + "dataPath": "params_shard_276.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.62.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "00cb242a6812248d1f67ecd4edeb893f" + }, + { + "dataPath": "params_shard_277.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.62.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "a20ababb2ab9a31237bd38bebdaef437" + }, + { + "dataPath": "params_shard_278.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.62.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "09b31afe918501ce2b9ddbdb429667d0" + }, + { + "dataPath": "params_shard_279.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.63.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "42e46f42c8c9e18ebcd417ac5c0365af" + }, + { + "dataPath": "params_shard_280.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.63.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "bda44f588564533538efc5e8a560df68" + }, + { + "dataPath": "params_shard_281.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.63.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "cd6e2902c36489d7038a6ae863b1ade8" + }, + { + "dataPath": "params_shard_282.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.63.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "2419629c93b01b3505be69eca7ba741a" + }, + { + "dataPath": "params_shard_283.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.64.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "548dfdda7b7bdea46e706e64ac4f7da2" + }, + { + "dataPath": "params_shard_284.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.64.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "11206a49582fcc69a28989df290726aa" + }, + { + "dataPath": "params_shard_285.bin", + "format": "raw-shard", + "nbytes": 31522816, + "records": [ + { + "name": "model.layers.61.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "model.layers.62.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 1048576 + }, + { + "name": "model.layers.62.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.62.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2375680 + }, + { + "name": "model.layers.62.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6045696 + }, + { + "name": "model.layers.62.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.62.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 13402112 + }, + { + "name": "model.layers.63.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 14450688 + }, + { + "name": "model.layers.63.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 14467072 + }, + { + "name": "model.layers.63.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 18137088 + }, + { + "name": "model.layers.63.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.63.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 25493504 + }, + { + "name": "model.layers.63.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 26804224 + }, + { + "name": "model.layers.64.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27852800 + } + ], + "md5sum": "82ca679049a1e5097c214e7fe8abd6bd" + }, + { + "dataPath": "params_shard_286.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.64.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "4c8ed961aa7d1e22d01f75041ece9e04" + }, + { + "dataPath": "params_shard_287.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.64.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "fd117d6edb79ca859383c33fb4c49a01" + }, + { + "dataPath": "params_shard_288.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.65.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "5eb350bc14c47bb74fdad1032fbe23df" + }, + { + "dataPath": "params_shard_289.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.65.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "52d56b07ba965eb0b17261fb030b7ba0" + }, + { + "dataPath": "params_shard_290.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.65.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "2a164be4504de844a53fd4dacec9fdde" + }, + { + "dataPath": "params_shard_291.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.65.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "401d5d6ea1724b2ef5770cf30e6b6571" + }, + { + "dataPath": "params_shard_292.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.66.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "5d8f00629686623ac722842cc1d851a2" + }, + { + "dataPath": "params_shard_293.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.66.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "d00c55e927af6f2ef990be12411d5196" + }, + { + "dataPath": "params_shard_294.bin", + "format": "raw-shard", + "nbytes": 26820608, + "records": [ + { + "name": "model.layers.64.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.64.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.64.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.64.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.64.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.65.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9732096 + }, + { + "name": "model.layers.65.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9748480 + }, + { + "name": "model.layers.65.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13418496 + }, + { + "name": "model.layers.65.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.65.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20774912 + }, + { + "name": "model.layers.65.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22085632 + }, + { + "name": "model.layers.66.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23134208 + }, + { + "name": "model.layers.66.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23150592 + } + ], + "md5sum": "bb828b260bedffdffc62b9c5806257d8" + }, + { + "dataPath": "params_shard_295.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.66.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "e47feceee237d279906db2df0c89d31c" + }, + { + "dataPath": "params_shard_296.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.66.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "17ca704ca685ce2bcc858472543afbe9" + }, + { + "dataPath": "params_shard_297.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.67.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "ef57c83fb99d46279cdd2e4dd719b16b" + }, + { + "dataPath": "params_shard_298.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.67.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "441e5a67c328628c0ced18d525af1184" + }, + { + "dataPath": "params_shard_299.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.67.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a605a27d8bff1b521919ba165f1196c2" + }, + { + "dataPath": "params_shard_300.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.67.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "7d6f6599fec9687046afb4c9580f6d0c" + }, + { + "dataPath": "params_shard_301.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.68.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "de0fb23d745d52cc480f5f7470685d95" + }, + { + "dataPath": "params_shard_302.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.68.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "e9b857c4e4e280816184ddcdd1299b06" + }, + { + "dataPath": "params_shard_303.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.66.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.66.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.66.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.66.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.67.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 9715712 + }, + { + "name": "model.layers.67.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 17055744 + }, + { + "name": "model.layers.67.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 18366464 + }, + { + "name": "model.layers.67.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19415040 + }, + { + "name": "model.layers.67.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 19431424 + }, + { + "name": "model.layers.67.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.68.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.68.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "71817ce6be6f787efe9bbe0b88d6f4ca" + }, + { + "dataPath": "params_shard_304.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.68.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "5f0a33af894ae0a56da82c06f5a79600" + }, + { + "dataPath": "params_shard_305.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.68.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "32ae23b6e3caea4fc5246aca49ef3da3" + }, + { + "dataPath": "params_shard_306.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.69.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "b4f90e3995f559d222f7b954c2803e11" + }, + { + "dataPath": "params_shard_307.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.69.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "53b66f34862e2691a861e9651c91d8c5" + }, + { + "dataPath": "params_shard_308.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.69.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "bb9481f9f21f721a4afc902dccab6906" + }, + { + "dataPath": "params_shard_309.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.69.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "6a0fc12629d1ecffafb68465511bfd40" + }, + { + "dataPath": "params_shard_310.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.70.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "b11171824779130af654a9f4e924ac92" + }, + { + "dataPath": "params_shard_311.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.70.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "aab22d1ea69a25413cdd2c9338630f61" + }, + { + "dataPath": "params_shard_312.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.7.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "e016d02c69b6e001e36c2400053e6463" + }, + { + "dataPath": "params_shard_313.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.7.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "e70aeac8ec56fbaad1efda97371892de" + }, + { + "dataPath": "params_shard_314.bin", + "format": "raw-shard", + "nbytes": 29163520, + "records": [ + { + "name": "model.layers.68.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.68.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.68.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.68.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.69.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.69.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.69.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.69.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.69.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.69.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.70.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.70.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 24428544 + }, + { + "name": "model.layers.7.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.7.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 25493504 + } + ], + "md5sum": "7e494d5d4927765aca6205e16c605901" + }, + { + "dataPath": "params_shard_315.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.7.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0d6c69e26423107b385540e2c5a85ecc" + }, + { + "dataPath": "params_shard_316.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.8.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "a7ec584c19ef5abb16aef8cc28865b93" + }, + { + "dataPath": "params_shard_317.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.8.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "d172fde4fe457af144b17c201e425863" + }, + { + "dataPath": "params_shard_318.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.8.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "f1bb7c700847b3f428487cb43a9e6f3e" + }, + { + "dataPath": "params_shard_319.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.8.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "66c9c6a95c6f6d83c91a155548912f9c" + }, + { + "dataPath": "params_shard_320.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.9.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "363483e66999506be0bf55f12dc9d343" + }, + { + "dataPath": "params_shard_321.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.9.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "011ccb5bbcc055edf27ec512d1f9c572" + }, + { + "dataPath": "params_shard_322.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.9.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "002b06578c697b0d580179c6c0ae45e7" + }, + { + "dataPath": "params_shard_323.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.70.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ec8f8170763c1df518e471200238302e" + }, + { + "dataPath": "params_shard_324.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.70.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "c3285a985f2d5968904a3581e3d295eb" + }, + { + "dataPath": "params_shard_325.bin", + "format": "raw-shard", + "nbytes": 31522816, + "records": [ + { + "name": "model.layers.7.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.7.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.7.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 7356416 + }, + { + "name": "model.layers.8.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 8404992 + }, + { + "name": "model.layers.8.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 8421376 + }, + { + "name": "model.layers.8.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 12091392 + }, + { + "name": "model.layers.8.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19431424 + }, + { + "name": "model.layers.8.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 19447808 + }, + { + "name": "model.layers.8.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 20758528 + }, + { + "name": "model.layers.9.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 21807104 + }, + { + "name": "model.layers.9.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 25477120 + }, + { + "name": "model.layers.9.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 26787840 + }, + { + "name": "model.layers.70.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 27836416 + }, + { + "name": "model.layers.70.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27852800 + } + ], + "md5sum": "94d6be65fb564c792f79477de8348e89" + }, + { + "dataPath": "params_shard_326.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.71.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d499e921b868c57337a40b5e4567cbb5" + }, + { + "dataPath": "params_shard_327.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.71.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "9e473164e368d7a6608c4dcdbf3f4e70" + }, + { + "dataPath": "params_shard_328.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.71.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "422d4d22894d26fa27e18aa5b8ff2153" + }, + { + "dataPath": "params_shard_329.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.71.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "2a9008d3684f47bf7584b7fd8dccb9bd" + }, + { + "dataPath": "params_shard_330.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.72.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d551c573fe158791ef607f99e1335bf4" + }, + { + "dataPath": "params_shard_331.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.72.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "4d8ddcaa3e0ae6ebcfc23e72d606526a" + }, + { + "dataPath": "params_shard_332.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.72.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "e55d7e8ae84c0415a57da1d04ce030cc" + }, + { + "dataPath": "params_shard_333.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.72.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "49f45fd9c20ad61df130502b594a747d" + }, + { + "dataPath": "params_shard_334.bin", + "format": "raw-shard", + "nbytes": 33112064, + "records": [ + { + "name": "model.layers.70.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.70.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.71.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7356416 + }, + { + "name": "model.layers.71.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 7372800 + }, + { + "name": "model.layers.71.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 11042816 + }, + { + "name": "model.layers.71.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 18382848 + }, + { + "name": "model.layers.71.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 18399232 + }, + { + "name": "model.layers.71.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 19709952 + }, + { + "name": "model.layers.72.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.72.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 20774912 + }, + { + "name": "model.layers.72.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 24444928 + }, + { + "name": "model.layers.72.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31784960 + }, + { + "name": "model.layers.72.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 31801344 + } + ], + "md5sum": "fe062af2ad056762b6f62ca2f41ae99f" + }, + { + "dataPath": "params_shard_335.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.73.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "a05a9b38ce653f175bd516e518cca02a" + }, + { + "dataPath": "params_shard_336.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.73.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "4cf2d488c83e25a77ed52b62909e9743" + }, + { + "dataPath": "params_shard_337.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.73.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "86bb7c308c361b913f8a70a09b38383e" + }, + { + "dataPath": "params_shard_338.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.73.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "60bdb4e85f228f942a57899b26102700" + }, + { + "dataPath": "params_shard_339.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.74.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "461adaa60ce741d00904deb7455fe699" + }, + { + "dataPath": "params_shard_340.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.74.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "7c438dd9ee4c966d36dd9df33f74f706" + }, + { + "dataPath": "params_shard_341.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.74.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "03ffd4a40257f12f73aa958cc5f885ff" + }, + { + "dataPath": "params_shard_342.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.74.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "bd209916cbcbfdec8d7162a9d8e5650f" + }, + { + "dataPath": "params_shard_343.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.75.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "9cbfde261c3a603c929efd2cadece7e5" + }, + { + "dataPath": "params_shard_344.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.75.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "9e6707c455195f4a2f118bb73eff1228" + }, + { + "dataPath": "params_shard_345.bin", + "format": "raw-shard", + "nbytes": 31522816, + "records": [ + { + "name": "model.layers.72.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "model.layers.73.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 1048576 + }, + { + "name": "model.layers.73.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.73.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2375680 + }, + { + "name": "model.layers.73.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6045696 + }, + { + "name": "model.layers.73.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.73.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 13402112 + }, + { + "name": "model.layers.74.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 14450688 + }, + { + "name": "model.layers.74.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 14467072 + }, + { + "name": "model.layers.74.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 18137088 + }, + { + "name": "model.layers.74.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.74.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 25493504 + }, + { + "name": "model.layers.74.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 26804224 + }, + { + "name": "model.layers.75.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27852800 + } + ], + "md5sum": "53ace84587da37ea76bd089a2750b398" + }, + { + "dataPath": "params_shard_346.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.75.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "02f613bf9e238c4478c4d8c6ce27c6b2" + }, + { + "dataPath": "params_shard_347.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.75.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "4f7cbbd00966e6c713bfb390b2d9fd89" + }, + { + "dataPath": "params_shard_348.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.76.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "8becf49f49891f37c7c85983e54dac26" + }, + { + "dataPath": "params_shard_349.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.76.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "561071b675d91719dde7a7d355a1ffc2" + }, + { + "dataPath": "params_shard_350.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.76.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "d0887b8c1e802678ea66b00dc5b20095" + }, + { + "dataPath": "params_shard_351.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.76.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "44aadc08fc7aba695d1b6a8831a01299" + }, + { + "dataPath": "params_shard_352.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.77.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "9d22fbf43fbd15319797f1300a97d580" + }, + { + "dataPath": "params_shard_353.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.77.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "82bca534904e8cdc7bd30a63c26f17b1" + }, + { + "dataPath": "params_shard_354.bin", + "format": "raw-shard", + "nbytes": 26820608, + "records": [ + { + "name": "model.layers.75.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.75.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.75.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.75.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.75.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.76.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9732096 + }, + { + "name": "model.layers.76.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9748480 + }, + { + "name": "model.layers.76.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13418496 + }, + { + "name": "model.layers.76.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.76.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20774912 + }, + { + "name": "model.layers.76.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22085632 + }, + { + "name": "model.layers.77.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23134208 + }, + { + "name": "model.layers.77.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23150592 + } + ], + "md5sum": "2991b658ef69d55c2b569d284ae7dafb" + }, + { + "dataPath": "params_shard_355.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.77.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "a396385c8e03960a570997f1e1bbc92b" + }, + { + "dataPath": "params_shard_356.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.77.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "9226ccc8ceb797ca826f815c73a5bce4" + }, + { + "dataPath": "params_shard_357.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.78.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "8e22cc94f7505466a1c0496707316856" + }, + { + "dataPath": "params_shard_358.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.78.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "d6ecba2346ee124625ae1c6fd43b9c29" + }, + { + "dataPath": "params_shard_359.bin", + "format": "raw-shard", + "nbytes": 12075008, + "records": [ + { + "name": "model.layers.77.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.77.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.77.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.77.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.78.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 9715712 + }, + { + "name": "model.layers.78.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 11026432 + } + ], + "md5sum": "8c1086647ed476abc49df2a716e4346c" + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..0ffc78a3939a803a9364a189aebd9867602de4a9 --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cacd6e0bb8daa6442991f80feb118080dcc96d4455532bc27fdafedc784b785 +size 525336576 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..9fc781bbd0fa9bc71782ba15ba0825c9691efe3d --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8876ae828b8b8bb4e336372e4cfe5cde9ac47747903a7daf8b048399b99c5beb +size 117440512 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..64c43d20acc66e2b28694c1eaef882102a2bc2fd --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e00b1dc78de7791fc8cf1506a883549c31d38b6974b03228576cc66f4d5778f +size 234881024 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..f3e20ffd1b2b86391b249f2de6eb58fed0cf28e2 --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2485c1dbe48246763e718811f9afe32263e32b415f261d55c1463b2b951025e4 +size 41943040 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..af798c4b4ffa45010f496283effceeab7a56150b --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e37a1e6d4ae15d2978d438dff252b1b059c3b863d3886199f9ced2493312443 +size 33554432 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..cd17714c4dfa3662e878a4bbb78ab6424f34f2ca --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2356559f9933e03c01424fb2b3a5b14c24b9fdf6dfa9a609eb4989ee6c9c2d8b +size 41943040 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..d2b44967627df775e63fe30b5d6baa2b843f16e1 --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f14010a682379b9bbb3eb648a70c8d719076b6df6043302f8c938ebee2aef0 +size 33554432 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..70c035e0f594f7a6204d09aedf023a9890434324 --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8985749d662e207c958dcb6c06ef92c91828467c26611640e035b57ac94e881 +size 117440512 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..6ae9d4a3b11aca819736980e122cd92e20f48ce7 --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e17393e1c3b429407a661cc8b07dc396ac9d54adb506f590c2d2cce3f96eac0f +size 234881024 diff --git a/params_shard_106.bin b/params_shard_106.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a2ff1f23875912790b71fbc5c01edbbdc20a3a5 --- /dev/null +++ b/params_shard_106.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c28b0742baab27782e6c5b5920da4503a7d627ec99408d31903250b6f4bd7345 +size 117440512 diff --git a/params_shard_107.bin b/params_shard_107.bin new file mode 100644 index 0000000000000000000000000000000000000000..931b0c71a4451804fb325d819311f8e09ff1bcb0 --- /dev/null +++ b/params_shard_107.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b7f3145392e0eda4c3dce4fbce1ef4665ba5590634658eff429753235a40bf +size 234881024 diff --git a/params_shard_108.bin b/params_shard_108.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb80d912c63165cc092c106c703be579eb720e3f --- /dev/null +++ b/params_shard_108.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0527235048510c697dd49af81770dfdd7a4fc645f8da7c0d883f62f5b111f79 +size 26804224 diff --git a/params_shard_109.bin b/params_shard_109.bin new file mode 100644 index 0000000000000000000000000000000000000000..2bf53096c98a8e4f777107c93d8ccbb105c8d97b --- /dev/null +++ b/params_shard_109.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67f8365f70f95e76ef74c159e22af730a97086f1db6203ea1ab1affdde5a07a3 +size 41943040 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..7c0fef0704202aac1669d3010ad3e609d7907b4b --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b492b805da64806bcb8ffb4981f957f44d997be5d30e654bbf108a5957681bb1 +size 29835264 diff --git a/params_shard_110.bin b/params_shard_110.bin new file mode 100644 index 0000000000000000000000000000000000000000..a102785d36495143354cf801a1a30ecff7c33c65 --- /dev/null +++ b/params_shard_110.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8488a5a8fdddc64c1c5ef96e32072bb8ddd90f0e1f75efff77ba9f174249e07 +size 33554432 diff --git a/params_shard_111.bin b/params_shard_111.bin new file mode 100644 index 0000000000000000000000000000000000000000..15924a9ec9906d0ef330cd913b5f7b3a299ccd22 --- /dev/null +++ b/params_shard_111.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d5a662ab326ee7384c361ce64a4cc12997c2963fa681b0f80399a4be13c381 +size 117440512 diff --git a/params_shard_112.bin b/params_shard_112.bin new file mode 100644 index 0000000000000000000000000000000000000000..47f0a4a60c34731f443c6c67a1d9b5039a531282 --- /dev/null +++ b/params_shard_112.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ff3c88e9188330b3d80cab57301ff018b914d019ed8c59a85a2878cb0854a01 +size 234881024 diff --git a/params_shard_113.bin b/params_shard_113.bin new file mode 100644 index 0000000000000000000000000000000000000000..1938d0f6ab943c7f61493869ba026331451968c5 --- /dev/null +++ b/params_shard_113.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80c06ad7131d275a1f902c7041892396b060b0ec3f2121e13c25a6fcc9dcbbb5 +size 41943040 diff --git a/params_shard_114.bin b/params_shard_114.bin new file mode 100644 index 0000000000000000000000000000000000000000..dc5f744f570b9300d853e28c47fb240cbcf1b34d --- /dev/null +++ b/params_shard_114.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3baae1db93a160feff7b1fa2f88564b6b23b58642a59722d1b373f3576aecb2a +size 33554432 diff --git a/params_shard_115.bin b/params_shard_115.bin new file mode 100644 index 0000000000000000000000000000000000000000..bdbb2254dd33880368dfdbd08965445ac9cd1937 --- /dev/null +++ b/params_shard_115.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28b9f6a5757ec76a6eb7df8004ebd6480904d804e470f33aa9073c15a08feaad +size 41943040 diff --git a/params_shard_116.bin b/params_shard_116.bin new file mode 100644 index 0000000000000000000000000000000000000000..a4b20cc2601817d0eef9a8e0949b21468c7d962a --- /dev/null +++ b/params_shard_116.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee9353d570b75f45ef3520be548426891461ed4977f2a8948bac6e0f3d1e0480 +size 117440512 diff --git a/params_shard_117.bin b/params_shard_117.bin new file mode 100644 index 0000000000000000000000000000000000000000..38353d6d7f8399fce63a419ecd32f557dfd76e52 --- /dev/null +++ b/params_shard_117.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce37d4f647fb32c301ebcba78a7cb12806b1cb8dd0373416e0a9cef35ef2b14 +size 234881024 diff --git a/params_shard_118.bin b/params_shard_118.bin new file mode 100644 index 0000000000000000000000000000000000000000..059902ebbd9d02aa428e0d096c55f943a20f6db6 --- /dev/null +++ b/params_shard_118.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b51fdb81d6a5db6d56119877505ecbb98bb5ef0e95aca6a766b9cb88ab33a7d +size 28114944 diff --git a/params_shard_119.bin b/params_shard_119.bin new file mode 100644 index 0000000000000000000000000000000000000000..37502bbfc2c4ab50e4c12b0fb20bc06a7e0576e1 --- /dev/null +++ b/params_shard_119.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d34d169a2ca064ea7f8c298ae009b0cfc4b3a1c9dc11787b3c906ffcf2150697 +size 33554432 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..e775e6b02aab3d713863dd8efa8fa02f42a867cc --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6033b06aefe5c17111f243e0901b93c6cdd829853664486bbf1d15c6af32b75 +size 41943040 diff --git a/params_shard_120.bin b/params_shard_120.bin new file mode 100644 index 0000000000000000000000000000000000000000..50b440c19a9d9e1374ac8660060f3d17d53a1cda --- /dev/null +++ b/params_shard_120.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74a40f1614c03411c6b9e92182c1e242bfcbf0906b53e6ae5bbf5b02af2051fa +size 117440512 diff --git a/params_shard_121.bin b/params_shard_121.bin new file mode 100644 index 0000000000000000000000000000000000000000..30007244fba59bfef38461c02f175ab06d77c272 --- /dev/null +++ b/params_shard_121.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0132074b88411b23012ba2b11da2d76ace1f8b2dba8190d2af99f7e2922d0647 +size 234881024 diff --git a/params_shard_122.bin b/params_shard_122.bin new file mode 100644 index 0000000000000000000000000000000000000000..66d35f261187961b6110fb9468c62f5aaf0d3792 --- /dev/null +++ b/params_shard_122.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a340b25d6a033e8e07b21803c8dd3aac7a0dc8eecb9ba9e093bafae2a11a9674 +size 41943040 diff --git a/params_shard_123.bin b/params_shard_123.bin new file mode 100644 index 0000000000000000000000000000000000000000..285d7a3a71ac453b0570dc4f1703c1118e63056c --- /dev/null +++ b/params_shard_123.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:833ec7ea100a3bf4a56af2900c005360d5422f71883fd08da23a03b2cffe1963 +size 33554432 diff --git a/params_shard_124.bin b/params_shard_124.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a5c145232ef51a542af34cd932e1a553b2ea96c --- /dev/null +++ b/params_shard_124.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c79bc5ec88e8df427ec0295f741f025a194014390c3851f5d958efffe4b1f3cd +size 117440512 diff --git a/params_shard_125.bin b/params_shard_125.bin new file mode 100644 index 0000000000000000000000000000000000000000..b3ca8272b74e2c2959338dbce1a0fb62399b7032 --- /dev/null +++ b/params_shard_125.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44d6ea240064ca0a988881842c46933e8f66b0c3e664a8681ab0f3140b5bcb44 +size 234881024 diff --git a/params_shard_126.bin b/params_shard_126.bin new file mode 100644 index 0000000000000000000000000000000000000000..2b214cbe70eeffa08b4011c20b6c7a2dc79e5964 --- /dev/null +++ b/params_shard_126.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783d332890b39035d6c87c1e9550acf4a1d92b631741aae5bc5fdca8589f4bc4 +size 41943040 diff --git a/params_shard_127.bin b/params_shard_127.bin new file mode 100644 index 0000000000000000000000000000000000000000..c9695e4c73cff7644cb44c528eb2faa8f383667b --- /dev/null +++ b/params_shard_127.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f0922ff697c66dd971d06bcb124c96fa1e84d1c29631f3619998e0143a7c63d +size 32817152 diff --git a/params_shard_128.bin b/params_shard_128.bin new file mode 100644 index 0000000000000000000000000000000000000000..d4e7d3a7686bdcac57a529f37ffb9862cb6330c3 --- /dev/null +++ b/params_shard_128.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:395447cd353f2a98b5ed65d1baa848acd0377fdef6c28eb0d8143058aa02ca71 +size 33554432 diff --git a/params_shard_129.bin b/params_shard_129.bin new file mode 100644 index 0000000000000000000000000000000000000000..4d94d1b3f9b11895fa136c78671f48520cf7efbb --- /dev/null +++ b/params_shard_129.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f0263df8f55efeb8c723b81362e455ac923ce1df361e11fa5b5b178db1f26eb +size 117440512 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..750d7eabc36b6c47747a81f91912e55e52d05e09 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a5810d125da6c521d8f65db0ac235217f8cd9757a00eaad6bb373b561fcf1d +size 33554432 diff --git a/params_shard_130.bin b/params_shard_130.bin new file mode 100644 index 0000000000000000000000000000000000000000..a916eb0b25e711b5566e9f14788438dea2ed4577 --- /dev/null +++ b/params_shard_130.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d3192dc5e5ffbe14ce66774addad8e004a40c4f83a110f2c0b163c15711e9b2 +size 234881024 diff --git a/params_shard_131.bin b/params_shard_131.bin new file mode 100644 index 0000000000000000000000000000000000000000..b6a218d3acb0580d1738e271a1eccc594c240bb8 --- /dev/null +++ b/params_shard_131.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f46cd0f6b7784867033ad5ee284c27269e3fd87f205856c994831ce1d09ac947 +size 41943040 diff --git a/params_shard_132.bin b/params_shard_132.bin new file mode 100644 index 0000000000000000000000000000000000000000..18493535785ed423b8a99fc2e5f640eb72f1e5e9 --- /dev/null +++ b/params_shard_132.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c438f5b1847c6117ec5d8267a85ff7806e173e821e680bdcef44df5dbd76cd6 +size 33554432 diff --git a/params_shard_133.bin b/params_shard_133.bin new file mode 100644 index 0000000000000000000000000000000000000000..657230a59a000e285cd75546f54bb55d3ec6b501 --- /dev/null +++ b/params_shard_133.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9533375366ae83bc7fd9762e0a40d6d3632f13bf64ad052d19aebba4e5a3c165 +size 117440512 diff --git a/params_shard_134.bin b/params_shard_134.bin new file mode 100644 index 0000000000000000000000000000000000000000..154945b9df78c72d26b560c3ffa5aeac40bae327 --- /dev/null +++ b/params_shard_134.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71fbd5eaf3d435992fa29638b2a02ee0c033ac0593cecf3d70abab5f57e533d +size 234881024 diff --git a/params_shard_135.bin b/params_shard_135.bin new file mode 100644 index 0000000000000000000000000000000000000000..6933796407b053e848a78952ca0fbade935d2b8b --- /dev/null +++ b/params_shard_135.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59218c3405bce144b005545d298596e264cbed4b2a949927dbeb37fb793b7eb5 +size 41943040 diff --git a/params_shard_136.bin b/params_shard_136.bin new file mode 100644 index 0000000000000000000000000000000000000000..b29753a1c0131a69a637ec83337321ac38954a8b --- /dev/null +++ b/params_shard_136.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37f9c0820f09ebf83c6b861a276094830f88090ef9d435f68c71cff0a3b1c492 +size 33554432 diff --git a/params_shard_137.bin b/params_shard_137.bin new file mode 100644 index 0000000000000000000000000000000000000000..42ce6db75b9e3122290fa1bfd5a4e74593619b4e --- /dev/null +++ b/params_shard_137.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b1db40741bdd260e9a8a0c4b0e8bd822625914605b55ba47b86a3b9acda11a +size 234881024 diff --git a/params_shard_138.bin b/params_shard_138.bin new file mode 100644 index 0000000000000000000000000000000000000000..7ab53d8ae6b261ec3c5acd72b0132c6e90683bc4 --- /dev/null +++ b/params_shard_138.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b59485d942badd6487453e0c74eaa244da580bdd5d8ccf6148fc0ae77d667249 +size 29196288 diff --git a/params_shard_139.bin b/params_shard_139.bin new file mode 100644 index 0000000000000000000000000000000000000000..e447cd517c0cad53326829c79b898b6c2c232b36 --- /dev/null +++ b/params_shard_139.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5f2ff59e698afbe8ccbefeafed7150bcf477673d123794c4f5fa9b9cbbd5e6b +size 41943040 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7d323584ab1d440ee7c668a5a60dca7a5367831 --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda82bc9f2afd671a8332f3d442069e1e7c6a1e1d090157d9334eec795cd1d5b +size 234881024 diff --git a/params_shard_140.bin b/params_shard_140.bin new file mode 100644 index 0000000000000000000000000000000000000000..d3fb127e2a9430613874cf1dd55e0264b7ec1b03 --- /dev/null +++ b/params_shard_140.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d86ec19a109056e74881b884c9f15a25bbb140afc859b93cc0d7710d1a1a1905 +size 33554432 diff --git a/params_shard_141.bin b/params_shard_141.bin new file mode 100644 index 0000000000000000000000000000000000000000..514f05438cee108205fbc2124394e2c1860c9bfc --- /dev/null +++ b/params_shard_141.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c4092a44af8c46890b7b64e24c57ee9fa982a23470098d82ff830038d2a6fed +size 117440512 diff --git a/params_shard_142.bin b/params_shard_142.bin new file mode 100644 index 0000000000000000000000000000000000000000..f41f476138ae534f8c66dce281c696eaf03fbb5d --- /dev/null +++ b/params_shard_142.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef284644bbfe44940a8eb24f3015285d9ffb2e2fdbd08bb2b1be404abefd3f2 +size 117440512 diff --git a/params_shard_143.bin b/params_shard_143.bin new file mode 100644 index 0000000000000000000000000000000000000000..1a7eff80cabbabf85d77ab0dfed641ac98997657 --- /dev/null +++ b/params_shard_143.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:686ed3bbb526854da71ac406e54ebe3671c31e8fd065a33fd95c9552b2cdf51c +size 234881024 diff --git a/params_shard_144.bin b/params_shard_144.bin new file mode 100644 index 0000000000000000000000000000000000000000..49e82eb61a93f629730d677426133d3408d9d8d7 --- /dev/null +++ b/params_shard_144.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3a253e360e417071ccb9ec886f65912fc66481fb0c03e3a9d7c8b618a4ac578 +size 41943040 diff --git a/params_shard_145.bin b/params_shard_145.bin new file mode 100644 index 0000000000000000000000000000000000000000..52109abb2447eb128453a38e38d9e60b15423320 --- /dev/null +++ b/params_shard_145.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57ef2bc57d15ccc0a18d3c887c9b9bf77096864f068b870ce6422ff6c986058e +size 33554432 diff --git a/params_shard_146.bin b/params_shard_146.bin new file mode 100644 index 0000000000000000000000000000000000000000..1eb5bf2d14dd020930070d13b038cf436c9c0408 --- /dev/null +++ b/params_shard_146.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c592f3e4ea42fe984ceb6095d4508abf7a92c3d6c2f5e37d51b57d0d0efccfd2 +size 117440512 diff --git a/params_shard_147.bin b/params_shard_147.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3a975f888fa3071622610d81e2098a1bac4e507 --- /dev/null +++ b/params_shard_147.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:401292e78089c1229fe9c8b58a65476f3ccae16f1aa87bc3647102826ba65e7b +size 234881024 diff --git a/params_shard_148.bin b/params_shard_148.bin new file mode 100644 index 0000000000000000000000000000000000000000..6650dc32e24bfcf84f4e193feae51c9ba4983093 --- /dev/null +++ b/params_shard_148.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6b3007f46aa6b1b6d4713ca4e4641df82b372f3ebd0f04fb16d26d0b69e45d0 +size 30490624 diff --git a/params_shard_149.bin b/params_shard_149.bin new file mode 100644 index 0000000000000000000000000000000000000000..42ed42cf37c0b40322e9d0c3a1e0faa149f03a12 --- /dev/null +++ b/params_shard_149.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35cd8b857b52521a92b8b5ce3c15a10f7d24190be8af0067c02faeac6c6e7f27 +size 41943040 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..133124ec23c1888a2edcf9234006bc47231b6172 --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909b24427e6b406e6c2c5c63e1bde7998480e812bb18d098b8aa70787523c77f +size 41943040 diff --git a/params_shard_150.bin b/params_shard_150.bin new file mode 100644 index 0000000000000000000000000000000000000000..aec455fd3839d611176a1b9432ff2e09b843c5e8 --- /dev/null +++ b/params_shard_150.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7e33c47c18713746ce61455e1ca52653e88fd20db7f3fa2eab053df51cc4f8d +size 33554432 diff --git a/params_shard_151.bin b/params_shard_151.bin new file mode 100644 index 0000000000000000000000000000000000000000..78d5173238d42371e39e02530720b32f92afa554 --- /dev/null +++ b/params_shard_151.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21cfb04895bcdc23b0f45ca19b05beb997c82ff653bd028fc362ca3af11a693 +size 41943040 diff --git a/params_shard_152.bin b/params_shard_152.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e44a1817d9dc4c8079530f649d71b34f62c2a0d --- /dev/null +++ b/params_shard_152.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00305b85e12d46c8d1310b8b3cbe4ea8dd7b2fd5942e00ce50181a9c5dc17749 +size 33554432 diff --git a/params_shard_153.bin b/params_shard_153.bin new file mode 100644 index 0000000000000000000000000000000000000000..1c37221de71ef6d4ba884f63759cf9f45503ffc9 --- /dev/null +++ b/params_shard_153.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a9208ecc7420b72170082b46ef422d55eb20a4fcb9766955d61efbef323f715 +size 117440512 diff --git a/params_shard_154.bin b/params_shard_154.bin new file mode 100644 index 0000000000000000000000000000000000000000..9721b4c6739283d9d97c1ccde1ee8275b5b3a231 --- /dev/null +++ b/params_shard_154.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391cea3abbeef8e4f18ec0d073a8e84019ca261f47e95f1ca115fc29b1f6846c +size 234881024 diff --git a/params_shard_155.bin b/params_shard_155.bin new file mode 100644 index 0000000000000000000000000000000000000000..b486d1c744e2769b739382fbff63a2f133917c93 --- /dev/null +++ b/params_shard_155.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a4749da449e7c6a360ba6905928ed9afbf60a995309ff7b46f86b9a93cd07a4 +size 117440512 diff --git a/params_shard_156.bin b/params_shard_156.bin new file mode 100644 index 0000000000000000000000000000000000000000..e16f2d57d96c1ad408b3f95b48f40120a7cbf2d2 --- /dev/null +++ b/params_shard_156.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ce7818eb18e3ca5a59080384a07f7ab42ee8c48f87d18a96a52e6a06ebb094 +size 234881024 diff --git a/params_shard_157.bin b/params_shard_157.bin new file mode 100644 index 0000000000000000000000000000000000000000..fbcf94df883c8ac281591cfdd4aad33b7d2d9cb7 --- /dev/null +++ b/params_shard_157.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75a88d66074e5218c71dead5c0f529b7ab38133217e14165b9c0dab8adb4466 +size 26804224 diff --git a/params_shard_158.bin b/params_shard_158.bin new file mode 100644 index 0000000000000000000000000000000000000000..81d014207bf73f802dd5092f26588c52c5bd69ec --- /dev/null +++ b/params_shard_158.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af87be79a15d313fb2b5ee05ff22450c1687e00256b4c56ba7e52cdf63fb250 +size 41943040 diff --git a/params_shard_159.bin b/params_shard_159.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea267f668fa6507a794c738f2f9d964ff80d0bd2 --- /dev/null +++ b/params_shard_159.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35076be2dfa7a52d16fb7ff204286cb58864fe0957e3056cdb352d43acfd57dc +size 33554432 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..1daeb34478ff42b41501b5f5ac4094d0dd2e6e17 --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7292a88990c48bd22b2567f45c308421c7c64f5bf6b0446c23e015700fadf808 +size 33554432 diff --git a/params_shard_160.bin b/params_shard_160.bin new file mode 100644 index 0000000000000000000000000000000000000000..0debd19bc8d525181e74f474cf7a8f3ef6db914f --- /dev/null +++ b/params_shard_160.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f4932558b0924061539c8e8fa86637463927053d9de119cfd265bb4de9b5a3 +size 117440512 diff --git a/params_shard_161.bin b/params_shard_161.bin new file mode 100644 index 0000000000000000000000000000000000000000..080f3299edb27ece345fb82ec55d99af1d3df2f0 --- /dev/null +++ b/params_shard_161.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05c0ba369d5c4673c533e0b264b1fd5305e8c557c74fca3b085eb8fbe4fc2f2 +size 234881024 diff --git a/params_shard_162.bin b/params_shard_162.bin new file mode 100644 index 0000000000000000000000000000000000000000..568fe983f99a9dcac75e9ea52412888963a3bc08 --- /dev/null +++ b/params_shard_162.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a741d8811ac817bc568b5f7c82e07449718fc46a188da3a85f859abddecd0a1e +size 41943040 diff --git a/params_shard_163.bin b/params_shard_163.bin new file mode 100644 index 0000000000000000000000000000000000000000..bb607e94092394598935b723eb89897fb227b1f1 --- /dev/null +++ b/params_shard_163.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd1528a901b32e78ad8fe1452f7e3ad4ca63e9ef31362a05f86b838671136e28 +size 33554432 diff --git a/params_shard_164.bin b/params_shard_164.bin new file mode 100644 index 0000000000000000000000000000000000000000..77b85faf55d56dbc4ca2b335b7cb496cca892e3c --- /dev/null +++ b/params_shard_164.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac5bd5e1a1f35040b9a8504d6ffc8c29a6faaa3e991da7d23b78f4bc00606b79 +size 41943040 diff --git a/params_shard_165.bin b/params_shard_165.bin new file mode 100644 index 0000000000000000000000000000000000000000..4385aca556ad1843df29596c91ab57e3d4aa7988 --- /dev/null +++ b/params_shard_165.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc0c740880ce4b217d2af68a3f7c1e1f1130c2aca090dfb4cd9e4850fc5a842 +size 117440512 diff --git a/params_shard_166.bin b/params_shard_166.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf6e3ec4ff27ab90dbbdec8cbab0b41b01235fd0 --- /dev/null +++ b/params_shard_166.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e105558556a77502627054d200a9d2bc1693da4ec3e29e07065c558d2364dc06 +size 234881024 diff --git a/params_shard_167.bin b/params_shard_167.bin new file mode 100644 index 0000000000000000000000000000000000000000..270ed32636d8076b69f054ced302818fce48ade4 --- /dev/null +++ b/params_shard_167.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67b1de9e7dff602d5801f1ae94e9a64d9a10cac81b61c8abab43de107787b9ea +size 28114944 diff --git a/params_shard_168.bin b/params_shard_168.bin new file mode 100644 index 0000000000000000000000000000000000000000..25da8068a3574bcc0c02e6726388088f7c7c7e92 --- /dev/null +++ b/params_shard_168.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a8e17a3cb1b803481c2732cf79074274d0c611475ec12c003d0b9c4f79f6dc +size 117440512 diff --git a/params_shard_169.bin b/params_shard_169.bin new file mode 100644 index 0000000000000000000000000000000000000000..f986b82950ab19d5321bc7166c8e60f175b8f5b5 --- /dev/null +++ b/params_shard_169.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5606983e8b98041e981bbcba9d03286141283b4651689bb0e36b133c070e90c9 +size 234881024 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..8216d3a48ce2ea037046cb83fea6a760cf128737 --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc7a0fbd51f916061e108102d808c07035cc9a8098f818c80dfee608a5c90213 +size 117440512 diff --git a/params_shard_170.bin b/params_shard_170.bin new file mode 100644 index 0000000000000000000000000000000000000000..53742faa4c9522cf168b0fa30ccac6681820a0c4 --- /dev/null +++ b/params_shard_170.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f047cf4f87e08141676fb241fab3a692c611f4bf01133118cd2b1fce7e90cc36 +size 41943040 diff --git a/params_shard_171.bin b/params_shard_171.bin new file mode 100644 index 0000000000000000000000000000000000000000..7c6276f239fab7fb6f867412858eb2c48cd3e244 --- /dev/null +++ b/params_shard_171.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977ad683411661cdfe6de7814d188472cbe6dfb8d1cd2abde127612dfb25c8ea +size 33554432 diff --git a/params_shard_172.bin b/params_shard_172.bin new file mode 100644 index 0000000000000000000000000000000000000000..f4f270049a34099e827ad24edebf1125e017c290 --- /dev/null +++ b/params_shard_172.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:172d6fec482f6e8b59fd74f776a3f44e1ed6632eec82f01e6d636f42fdb9169f +size 117440512 diff --git a/params_shard_173.bin b/params_shard_173.bin new file mode 100644 index 0000000000000000000000000000000000000000..a41298c851f2848ab0b7571f111f0b44417156cb --- /dev/null +++ b/params_shard_173.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f06c0f29bad147f838fe6f4c6886947aa1e3e011250c9b75be37998d34d7a669 +size 234881024 diff --git a/params_shard_174.bin b/params_shard_174.bin new file mode 100644 index 0000000000000000000000000000000000000000..e1bc4e0c8e0119bb0eeeb0d1d44bc50c794a0535 --- /dev/null +++ b/params_shard_174.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6872b1657925eeb1c24a68dbd553cb1a9c3a22c87eb73d7c31671910691d0c40 +size 41943040 diff --git a/params_shard_175.bin b/params_shard_175.bin new file mode 100644 index 0000000000000000000000000000000000000000..44da91d7700fe642479d78759516f52110ecaf5a --- /dev/null +++ b/params_shard_175.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:539cfe1bdb25c51526df5459e8727f86923428e291e6ad5278fcf40dbd87db57 +size 33554432 diff --git a/params_shard_176.bin b/params_shard_176.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7cd0ea25245103de04c9a47f97281b34ecd30b3 --- /dev/null +++ b/params_shard_176.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d767fbdde6a227abfaa749433bf4eb70529d9c26ac664d63a00c61df4a36e02 +size 33112064 diff --git a/params_shard_177.bin b/params_shard_177.bin new file mode 100644 index 0000000000000000000000000000000000000000..3558a570c865d60d0c80ce115bbbd11fff4d9197 --- /dev/null +++ b/params_shard_177.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e13b2d035e7d96f4e03165ff2c78e928fad91cf0c6c92346f95ecd550324ed0 +size 41943040 diff --git a/params_shard_178.bin b/params_shard_178.bin new file mode 100644 index 0000000000000000000000000000000000000000..b59f3fdc9f2232873b48fdf239ba675f1553ce81 --- /dev/null +++ b/params_shard_178.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73c620b714ef8070d24d9cf6e3795b5a0b3da533a7ae4b3aebb1ce8dc2c37067 +size 117440512 diff --git a/params_shard_179.bin b/params_shard_179.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8453fa57a66396755a6b45c3a234f00dcb73331 --- /dev/null +++ b/params_shard_179.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc54090ca4e7132a230e2982db14aa11fc50670fc7451016f624977d232391b1 +size 234881024 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..acbc2bf086066a58dee0f8cf1ac5bfa187563f14 --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13ef8d343db8922a295378d0a2da205ded31ecc6332c22aeba71fc12bb804676 +size 117440512 diff --git a/params_shard_180.bin b/params_shard_180.bin new file mode 100644 index 0000000000000000000000000000000000000000..9e9cd54c8c8c66f54f15cff3df3ace523c28b260 --- /dev/null +++ b/params_shard_180.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f47ce2c43812626ed28b4939cdf5e65584ae67cb95e6813aa1b192fac3a770 +size 33554432 diff --git a/params_shard_181.bin b/params_shard_181.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc439f9e95baf9b0ebb033c0f392003e994f5528 --- /dev/null +++ b/params_shard_181.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4146b7bcaed6fed61e75c76890b9478e09f4a48c9d14d555f5e0814841fc958 +size 117440512 diff --git a/params_shard_182.bin b/params_shard_182.bin new file mode 100644 index 0000000000000000000000000000000000000000..56a8d3196dfff8a18b7804aa3258256287902340 --- /dev/null +++ b/params_shard_182.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:446d412ec142aa7fbd040f3a701e613024fd16c26b9811480a5c1c5a47a7eefb +size 234881024 diff --git a/params_shard_183.bin b/params_shard_183.bin new file mode 100644 index 0000000000000000000000000000000000000000..1665c60053d02253938be4417811b5b52ba7d5e0 --- /dev/null +++ b/params_shard_183.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01d92039981487c73bb4339ff5e5d82eece7ae7e98c1e8539d56b4bbe2e76961 +size 41943040 diff --git a/params_shard_184.bin b/params_shard_184.bin new file mode 100644 index 0000000000000000000000000000000000000000..c56a91d20ce2d36f412cf47e360e0db76299427e --- /dev/null +++ b/params_shard_184.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ad1ca88edb19b84ea80b7da17bbcc3e33e0daf7b94621721761d347c2cf044 +size 33554432 diff --git a/params_shard_185.bin b/params_shard_185.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f160d8db180bf3bd33805cdabaca31d9e4ba70e --- /dev/null +++ b/params_shard_185.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da180b69435598e15961e8223dbefe76f00c2b12d5c7919e3ac8c644bc9f2c22 +size 117440512 diff --git a/params_shard_186.bin b/params_shard_186.bin new file mode 100644 index 0000000000000000000000000000000000000000..0eb16d54b3ce0a2f1785b338551c713b3c438581 --- /dev/null +++ b/params_shard_186.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:847686563852e33c85bd71e91026f006b34226e04521553e97d79271b2e5e192 +size 234881024 diff --git a/params_shard_187.bin b/params_shard_187.bin new file mode 100644 index 0000000000000000000000000000000000000000..0fbc169728d4ae45af945d5f61652a43f8d32916 --- /dev/null +++ b/params_shard_187.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b685057259a4cda5a3b8784810da5f0229513c3d74801b91a54563a8e53b55 +size 31522816 diff --git a/params_shard_188.bin b/params_shard_188.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f00381b0e888cc197b955d5fd3be274706ecbf9 --- /dev/null +++ b/params_shard_188.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a30b97044ee2af75b9dc6d7f2ad5db1a650bc1868e1d8df9db6d38de6dfebf9 +size 41943040 diff --git a/params_shard_189.bin b/params_shard_189.bin new file mode 100644 index 0000000000000000000000000000000000000000..f4d45636171232590299a0b3e01ad7594795375d --- /dev/null +++ b/params_shard_189.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1099675cfdb19486bf85b030b413e7ae50e6286eb61989ebab569ff012face2f +size 33554432 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..3898ef404b1bc2ab9c036a4b2b7a415c78fd6351 --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d051f4eec40251d423b466cbd3acaf790bc040a9b22a51b05d004a87b49bedd +size 234881024 diff --git a/params_shard_190.bin b/params_shard_190.bin new file mode 100644 index 0000000000000000000000000000000000000000..50120b66a1b5dc439ac5f7520eb61937ccdc4bfe --- /dev/null +++ b/params_shard_190.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8c9e042c2867b18fdf3e9dcf1cdd64e274dd1e75783af5f7a575b97d0bd8f87 +size 117440512 diff --git a/params_shard_191.bin b/params_shard_191.bin new file mode 100644 index 0000000000000000000000000000000000000000..9b75b7f5e7144709c485d912bf11c85f80b454bc --- /dev/null +++ b/params_shard_191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6710b6955cf44e04702741937953b33faa0f93b5d07029257c8779e3dc66edc4 +size 234881024 diff --git a/params_shard_192.bin b/params_shard_192.bin new file mode 100644 index 0000000000000000000000000000000000000000..91727b5fbf6d4134d461a19e356b7b417c93c378 --- /dev/null +++ b/params_shard_192.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c4f32d0a95a6fd634efc47bb3fa9c8f50121f882f1ad55749fffc11fa937d0 +size 41943040 diff --git a/params_shard_193.bin b/params_shard_193.bin new file mode 100644 index 0000000000000000000000000000000000000000..0d8f159883821d50ea1e9ddd684a94841d9f61d9 --- /dev/null +++ b/params_shard_193.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458f1ad09ddb9e3a9468ae7dc21fe98543532a3391792bc344d83d47ed0cb0f2 +size 33554432 diff --git a/params_shard_194.bin b/params_shard_194.bin new file mode 100644 index 0000000000000000000000000000000000000000..3b79b6cae0db0f6f6364ab92286ebc04ec6b03ca --- /dev/null +++ b/params_shard_194.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64fc1b8aef19c4d872a474faa4771d76f74fa7d96da1ffc287bf983ce451045f +size 117440512 diff --git a/params_shard_195.bin b/params_shard_195.bin new file mode 100644 index 0000000000000000000000000000000000000000..666645e9d8bed5e9f09c7a6efea0258b126ccd61 --- /dev/null +++ b/params_shard_195.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd398ae37f5969efd7ab159f5bb0ce5516eb6317b17380396c889b6552fbed3f +size 234881024 diff --git a/params_shard_196.bin b/params_shard_196.bin new file mode 100644 index 0000000000000000000000000000000000000000..3885a46b43993cb476d2a0665ed5fe9cdb98ae22 --- /dev/null +++ b/params_shard_196.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad1f4bf2108a5409258fafb15d2ac98157df1faaa57b5e622ca90f13a11c9724 +size 26820608 diff --git a/params_shard_197.bin b/params_shard_197.bin new file mode 100644 index 0000000000000000000000000000000000000000..08d5287b0a1a54399a9b98973d666a762fc18150 --- /dev/null +++ b/params_shard_197.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83fb7688d5e81438713bf8afe10d10893d90ffbb467c4fd49fd97267171b95ba +size 41943040 diff --git a/params_shard_198.bin b/params_shard_198.bin new file mode 100644 index 0000000000000000000000000000000000000000..6103df298e4d3b9af0060f82d352c4c1bec50089 --- /dev/null +++ b/params_shard_198.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04408f514860f977fa11e5327dd5b71b4828c814a8ac70aae7ee6c888138b433 +size 33554432 diff --git a/params_shard_199.bin b/params_shard_199.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e847c71c6d7d1e96fe80d416c0a92d44344accf --- /dev/null +++ b/params_shard_199.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f828a22afbd79747f04ec8d1bd6fb7d33d8e3037b6713d0446f2d6e6bf5d495 +size 234881024 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf07e357d20092ef7d9998fe7a15bcf341b2b952 --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f0df50039409a76bcca1402feb4c4df0a6e276cc73615f111b3d3991eef2b5 +size 234881024 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..294d724a10591dbad3ef09ae4e2e350cd820d70f --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ad1026ac02c73b7fe9f987f76bd82791e18be45f2bf56467d56e2758e5f0d29 +size 26804224 diff --git a/params_shard_200.bin b/params_shard_200.bin new file mode 100644 index 0000000000000000000000000000000000000000..7330b5044dba7ce5744b7a413f5117f986bad7b0 --- /dev/null +++ b/params_shard_200.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:510d684179fc3823bb65890fa8cb15b518414b08386b7981a5e00847eb1d2097 +size 41943040 diff --git a/params_shard_201.bin b/params_shard_201.bin new file mode 100644 index 0000000000000000000000000000000000000000..4caf1cbc527c720db44f5b76668156a6d2df3bb0 --- /dev/null +++ b/params_shard_201.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b202490ed98fc11c9cc05c8661eb6a101bf05376f18f9ebfe4bf47893905280 +size 33554432 diff --git a/params_shard_202.bin b/params_shard_202.bin new file mode 100644 index 0000000000000000000000000000000000000000..24a88da6c04d4e84d697c73c10decffa31f2ffa3 --- /dev/null +++ b/params_shard_202.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c67492bcd2ef33256544f22e70a719c2a8181a1f98fb596b11956bebce252c +size 117440512 diff --git a/params_shard_203.bin b/params_shard_203.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d8dc1744a74e1340e8d24fa539c6ad34369cfdf --- /dev/null +++ b/params_shard_203.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b64a375b7193248acfb729934d9fdb1ad50d2704fa2892a497d99e3779a34d97 +size 117440512 diff --git a/params_shard_204.bin b/params_shard_204.bin new file mode 100644 index 0000000000000000000000000000000000000000..fe402ad8de8a74bc5aa4d542a7d85d14840f6683 --- /dev/null +++ b/params_shard_204.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c35484f912357ed3117bb05190979237bfd51328b01f574735295259d3e7ec9 +size 234881024 diff --git a/params_shard_205.bin b/params_shard_205.bin new file mode 100644 index 0000000000000000000000000000000000000000..54b62f0213c9ee7d2ae44b4b77914533ad793f51 --- /dev/null +++ b/params_shard_205.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485fb5e3a8ba4e4d78137cfa36464ef9b49efc0a390bcd1b2d9a40883aa60220 +size 26804224 diff --git a/params_shard_206.bin b/params_shard_206.bin new file mode 100644 index 0000000000000000000000000000000000000000..b169a7c53689c1516fd032dbf4fee8cc35331b13 --- /dev/null +++ b/params_shard_206.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ff36f694c9f6d36057a05696afe83b073e1a969d53c87ff049de689b0c91ea +size 41943040 diff --git a/params_shard_207.bin b/params_shard_207.bin new file mode 100644 index 0000000000000000000000000000000000000000..b645a6cf29d49ec87965ed135460b067bc58b746 --- /dev/null +++ b/params_shard_207.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9594dee20b557191cdd66b5cfdad53149e9be856c2550a807adc95721ee56ab1 +size 33554432 diff --git a/params_shard_208.bin b/params_shard_208.bin new file mode 100644 index 0000000000000000000000000000000000000000..58a3247bb7d635d3a7a689d12684047613f69dff --- /dev/null +++ b/params_shard_208.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82944b0a9dd82bb9c173a5ff615b1dbbf482fcf0463d8e04800d81cfef6a0b62 +size 117440512 diff --git a/params_shard_209.bin b/params_shard_209.bin new file mode 100644 index 0000000000000000000000000000000000000000..801ab6c57e6b54e0b48092c0ebe9b44ecacd01b1 --- /dev/null +++ b/params_shard_209.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7172ae2b7a1cba6aaf40da0eebe0fd76db38afa0780ced93f4917bb4bb2668a +size 234881024 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..19be76dde1b0fa2defbcdd9527f52eeef61c2ca7 --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a6e1dcb595cab657be8de4ddffdb7c4aada3596f6492e07c2ee4ddd45490604 +size 41943040 diff --git a/params_shard_210.bin b/params_shard_210.bin new file mode 100644 index 0000000000000000000000000000000000000000..75fd07ae3220af7db0c7469e00c663ac1e60ade6 --- /dev/null +++ b/params_shard_210.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9a68b999c3fb1a33313292bc17fbe7770a1409d9372dc807a40986975c781b +size 41943040 diff --git a/params_shard_211.bin b/params_shard_211.bin new file mode 100644 index 0000000000000000000000000000000000000000..4f6b7eec68bb92f54c8f3660053b01bb9928c336 --- /dev/null +++ b/params_shard_211.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acddaf97dfd70f9355550cb9507b176753ec3b0a2c469ed4af453e8ad0702594 +size 33554432 diff --git a/params_shard_212.bin b/params_shard_212.bin new file mode 100644 index 0000000000000000000000000000000000000000..9909d7535627e0645756405a5c0daa05a63fdd6e --- /dev/null +++ b/params_shard_212.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c17a811ae524529335c6b15f88a58dfe1a99f48ce7a6b57b94f8a8602fcddd3 +size 41943040 diff --git a/params_shard_213.bin b/params_shard_213.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7a1925ad3effe462013b6c311f85eb8b5422bab --- /dev/null +++ b/params_shard_213.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c390dff687f03522ecd57d089ca41b098fb6525e56771db00d5d5d83ee329ae +size 33554432 diff --git a/params_shard_214.bin b/params_shard_214.bin new file mode 100644 index 0000000000000000000000000000000000000000..477c301947cfd093617e38adb382d494ee4cc13c --- /dev/null +++ b/params_shard_214.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70d9f8b399d65635478f09c2700a3c52f77d8a9bc6adc4f121924cdf2412e47b +size 117440512 diff --git a/params_shard_215.bin b/params_shard_215.bin new file mode 100644 index 0000000000000000000000000000000000000000..c36c34ee04b212ff76d28e7ae92247c130dd38d7 --- /dev/null +++ b/params_shard_215.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a54e75304d053de5908c29155f579613477a13797482c2ace2a22fdd4dadfa10 +size 234881024 diff --git a/params_shard_216.bin b/params_shard_216.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e36210d03c259231519ca0445e63bddff451155 --- /dev/null +++ b/params_shard_216.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d56881347e1466af428b34836291625b56ec177a2e9449bf2d8dc29d26f0b83 +size 29163520 diff --git a/params_shard_217.bin b/params_shard_217.bin new file mode 100644 index 0000000000000000000000000000000000000000..55f08f1461ce95dcb659f43e5f079a2d7947f9bb --- /dev/null +++ b/params_shard_217.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f874f09f7ee6feaa985e3152c53f14d0dabac02a96459072264768875b051e51 +size 117440512 diff --git a/params_shard_218.bin b/params_shard_218.bin new file mode 100644 index 0000000000000000000000000000000000000000..0cbd746bdf4ff0c758535f5863cf563b632b2dce --- /dev/null +++ b/params_shard_218.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3dff19213760ac7f0fc4c1e63b8bd2e757cd42c5ade09a8a38e9d7fb09b6fee +size 234881024 diff --git a/params_shard_219.bin b/params_shard_219.bin new file mode 100644 index 0000000000000000000000000000000000000000..39a35828275bf0a84551cf2cabd32ce61212ce48 --- /dev/null +++ b/params_shard_219.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9332d48953bbfcf4166678f55be4e0f85116b47ef0b00335e113a775b5ad1156 +size 41943040 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..0745b983df3140460c9b187fbdc101d660962d89 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa5f28f2c6b75e0d2cc7448e9f54d248fb41d20ea779cb96cf4d4402ba18a5d5 +size 33554432 diff --git a/params_shard_220.bin b/params_shard_220.bin new file mode 100644 index 0000000000000000000000000000000000000000..92c770e9fe1762cfae7b13a0a98088471da425cf --- /dev/null +++ b/params_shard_220.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:819aa86807d3dd1d196d8afde633c257922a71e994c523a09e2af3bf49906b6b +size 33554432 diff --git a/params_shard_221.bin b/params_shard_221.bin new file mode 100644 index 0000000000000000000000000000000000000000..09cee5923e5940bf29f9e1636b8e58234b54a36a --- /dev/null +++ b/params_shard_221.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d2a367afb2e2529a2b40aa37e1e5a9da6ee23119647d625c3bbdfac95dff010 +size 117440512 diff --git a/params_shard_222.bin b/params_shard_222.bin new file mode 100644 index 0000000000000000000000000000000000000000..627ecb74a7f4cc91633dd1fcf16552cebf8bd22c --- /dev/null +++ b/params_shard_222.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29f8f03f464fdb7f0834304cc30da6ed1a2189789e645196eb91c9a5e987a788 +size 234881024 diff --git a/params_shard_223.bin b/params_shard_223.bin new file mode 100644 index 0000000000000000000000000000000000000000..e1dae951818f81e63834e60282eab8e2d92ef5dc --- /dev/null +++ b/params_shard_223.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c74e6d4dc69937e96299fece3de7a53d15bd890f4eb1764e54cbc258ceb509f6 +size 41943040 diff --git a/params_shard_224.bin b/params_shard_224.bin new file mode 100644 index 0000000000000000000000000000000000000000..219f839aea1bc132ed7d975a9fdee07a3581e871 --- /dev/null +++ b/params_shard_224.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03472e11fe3bc6558d8ff8bd7ca793bdfbd0acbe88147c0235f0d0be42817652 +size 33554432 diff --git a/params_shard_225.bin b/params_shard_225.bin new file mode 100644 index 0000000000000000000000000000000000000000..9af32a224a2569807b526702c5cdc6f0f3b47da4 --- /dev/null +++ b/params_shard_225.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0359419c3e93d2e8ee3079c9ce1fc76ae6090baad95ae3e0685828ed90d4524 +size 33112064 diff --git a/params_shard_226.bin b/params_shard_226.bin new file mode 100644 index 0000000000000000000000000000000000000000..3bdbbca6f0660158f275c8a072d3836d26970efd --- /dev/null +++ b/params_shard_226.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:965ce0e216b544cdf4f6df7c904babafe65e0d8bc3bc90e7a1bbc5ae0f2be191 +size 41943040 diff --git a/params_shard_227.bin b/params_shard_227.bin new file mode 100644 index 0000000000000000000000000000000000000000..9136f29e394c054f4a3734c53d61f5eef4555596 --- /dev/null +++ b/params_shard_227.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:478f6a1bd5af8683f5a149d394c8fc83bd113ea8057930efa5937a1b25eca443 +size 117440512 diff --git a/params_shard_228.bin b/params_shard_228.bin new file mode 100644 index 0000000000000000000000000000000000000000..c678d2c9338f960dce11784c5d0558acf8e6a738 --- /dev/null +++ b/params_shard_228.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac9f2de54fb0de086f8bc9402705273bc8a6df28b73d7fb3785eac3c373d39e +size 234881024 diff --git a/params_shard_229.bin b/params_shard_229.bin new file mode 100644 index 0000000000000000000000000000000000000000..7beefdb01263d911eac1da1e38009a9bac401da6 --- /dev/null +++ b/params_shard_229.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26c248c87d54589d8bca4bd546490aa05222e73154881ec047830f59326dd765 +size 33554432 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d562732d878f9cc391d0b12f460d2b8f559ed8d --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0254c7a5dc679c1a7d1f5f115a59453fa5bb2a351400007f6d11d1c5455f84de +size 117440512 diff --git a/params_shard_230.bin b/params_shard_230.bin new file mode 100644 index 0000000000000000000000000000000000000000..4f8c579e6cc267a25348490101069760bef14cff --- /dev/null +++ b/params_shard_230.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eed4f691cb874af588f2a3a6e75fcb19eb7345bf6945e8607caa32f2f03d1c1 +size 117440512 diff --git a/params_shard_231.bin b/params_shard_231.bin new file mode 100644 index 0000000000000000000000000000000000000000..adf6b37541b35f6ac84130aae4eec9700c27eeed --- /dev/null +++ b/params_shard_231.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e7a637a8ff14f07d36d286dbd2fd19a0f0175fa3f5067ac67ad665443e78a13 +size 234881024 diff --git a/params_shard_232.bin b/params_shard_232.bin new file mode 100644 index 0000000000000000000000000000000000000000..f1797f810d0bc5cc58a2922cdf0acb7d76f3f2dc --- /dev/null +++ b/params_shard_232.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bab44b76b45af440005332b6e988a905946df24ebf6c87d95ee73e5beb4d9f42 +size 41943040 diff --git a/params_shard_233.bin b/params_shard_233.bin new file mode 100644 index 0000000000000000000000000000000000000000..adcae9b3c0eb3969e4048e632a0fad3b6531ce7f --- /dev/null +++ b/params_shard_233.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134c2930586ff176fdc7fe0c75c0743464ae3b1f5ef6f94bc62e7814691a38d9 +size 33554432 diff --git a/params_shard_234.bin b/params_shard_234.bin new file mode 100644 index 0000000000000000000000000000000000000000..0ee65d77d823947f5d69a1df2d0c0d3de0683c9e --- /dev/null +++ b/params_shard_234.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75f519c8178e26148ad311ff1660587bc5525cd3dea1315a947d99b7b5ae18c6 +size 117440512 diff --git a/params_shard_235.bin b/params_shard_235.bin new file mode 100644 index 0000000000000000000000000000000000000000..21f39d73fe134d57aa02e2169bf6f9a9d4cb7a2b --- /dev/null +++ b/params_shard_235.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa38c821adb9ccafd887292a38f3ac00653bfa08ffb89f41349cb26e159a18bd +size 234881024 diff --git a/params_shard_236.bin b/params_shard_236.bin new file mode 100644 index 0000000000000000000000000000000000000000..d54aeae486b3371a2b58c976ed9855a65b617308 --- /dev/null +++ b/params_shard_236.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bb0c3cfc525acfe5b4c916d43fcf9ba3a7a57dcb3a32fe35b61909ab9a5b9a4 +size 31522816 diff --git a/params_shard_237.bin b/params_shard_237.bin new file mode 100644 index 0000000000000000000000000000000000000000..f07f0f62fc0ce9ebc5fe22b743b54d635f530c8b --- /dev/null +++ b/params_shard_237.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72fdfca5d85dee255d4a4faefbb02c900a9fe4b0dac49606172c15f25b7a498f +size 41943040 diff --git a/params_shard_238.bin b/params_shard_238.bin new file mode 100644 index 0000000000000000000000000000000000000000..df27a453c9c82a3b642609ffbb88bb3c38164670 --- /dev/null +++ b/params_shard_238.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe4f04eaadb39eee1875849513955e89099562d4dd9065a17314a70346470e97 +size 33554432 diff --git a/params_shard_239.bin b/params_shard_239.bin new file mode 100644 index 0000000000000000000000000000000000000000..4ee6ec5b125c99941f96c6366d3f1b7d9992bf71 --- /dev/null +++ b/params_shard_239.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25fb263685a3be568862b0c3a2cb78e6ef91945074dc82d0dcda0feecb0db224 +size 117440512 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..e64293b89aaa19f781a9a886e8a726e3408e939d --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033cd9016fc7507add85b6bdf4bedfade9ebb2c19807c4e411c9a09d3bb308d1 +size 234881024 diff --git a/params_shard_240.bin b/params_shard_240.bin new file mode 100644 index 0000000000000000000000000000000000000000..6e6f7363d88ffa98cf5c00a8f723d030b23ceb2a --- /dev/null +++ b/params_shard_240.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eaad85f00f2a9554c8a21ddd3b9744c470d0e14fa7ef32bb8033e4a0dee5a07 +size 234881024 diff --git a/params_shard_241.bin b/params_shard_241.bin new file mode 100644 index 0000000000000000000000000000000000000000..681256ba8d40fc98a4ea1b6f43f79521e74d3010 --- /dev/null +++ b/params_shard_241.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bff1e7908c553aa5e50b275879b2f122be137c764c9e45b60d5008b019ecc068 +size 41943040 diff --git a/params_shard_242.bin b/params_shard_242.bin new file mode 100644 index 0000000000000000000000000000000000000000..bc5fd7062d483947ad8d4fad9f8d62395bc094bf --- /dev/null +++ b/params_shard_242.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:519dc72a2b4ffaecfdac05b8abde99405f00c483ddb301314843137c61325d74 +size 33554432 diff --git a/params_shard_243.bin b/params_shard_243.bin new file mode 100644 index 0000000000000000000000000000000000000000..ec1a0cbfd5a33290b5dea2706a22fe967080d309 --- /dev/null +++ b/params_shard_243.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19301c91d3f5bdeb8c4b7cbedc387d01aecd0862959907c5eafa2121fd5f4017 +size 117440512 diff --git a/params_shard_244.bin b/params_shard_244.bin new file mode 100644 index 0000000000000000000000000000000000000000..7dd7d83aebbeafb76b1317d73d9292a690c24cf9 --- /dev/null +++ b/params_shard_244.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5cefdb0e6c2e233dfc16b67aa8a03522b0040426fbaa348400c8d6d0d1b977c +size 234881024 diff --git a/params_shard_245.bin b/params_shard_245.bin new file mode 100644 index 0000000000000000000000000000000000000000..d4c045c7909fa399e56b02e9a879f5a41d1366a3 --- /dev/null +++ b/params_shard_245.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e4e1b0e2c58c1f033ecc397ac8a803af59a32f639b76f679bc3c476dad94e2 +size 26820608 diff --git a/params_shard_246.bin b/params_shard_246.bin new file mode 100644 index 0000000000000000000000000000000000000000..f6403510d0ed36f9364ba6947d210a4846c4459b --- /dev/null +++ b/params_shard_246.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac00e5247068d8f6fae19826f85f8d695942382a6a9403e6c7e0cc1eccb458b6 +size 41943040 diff --git a/params_shard_247.bin b/params_shard_247.bin new file mode 100644 index 0000000000000000000000000000000000000000..24d6c3b63541caf5e76aecbb0f30800933752a19 --- /dev/null +++ b/params_shard_247.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2b0449a649e4d41cb2820353fccbe288801b9823fbfa8083c2e53ffbb59c81a +size 33554432 diff --git a/params_shard_248.bin b/params_shard_248.bin new file mode 100644 index 0000000000000000000000000000000000000000..56d6c8a62394db4f9fcc2570ac2988cb54b22ef0 --- /dev/null +++ b/params_shard_248.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4da5b03ed92fe28693c7a216f718485245c0ecbd562527bd72178fc73b4991b2 +size 234881024 diff --git a/params_shard_249.bin b/params_shard_249.bin new file mode 100644 index 0000000000000000000000000000000000000000..d26fa1e6efe651acb09cfe7ac842ea656b847b3f --- /dev/null +++ b/params_shard_249.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e608538f1282084a42718e229aca941706372f8d335289b1212b080cf6f7951 +size 41943040 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..35a4007d717cbf88839af5e71b9af8def0f14536 --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8cdac12670b8a30e659719b0cb6624508b1976ec4f6925eb9850334094760c5 +size 41943040 diff --git a/params_shard_250.bin b/params_shard_250.bin new file mode 100644 index 0000000000000000000000000000000000000000..a9964309848fd821b7f8d590180d92e3ca525a3e --- /dev/null +++ b/params_shard_250.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3f3c7e37232671e35c15d6082412ce10963a977a89b0eda44a74d2d70701e4 +size 33554432 diff --git a/params_shard_251.bin b/params_shard_251.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a7db27c4bd1aee845cf1d57b9b518988e8380e2 --- /dev/null +++ b/params_shard_251.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0344e2a50a7339a31191db95d6b7928cf9d9099637dc701a2cae0fe5ba9d082a +size 117440512 diff --git a/params_shard_252.bin b/params_shard_252.bin new file mode 100644 index 0000000000000000000000000000000000000000..5894fdc88ed2617b6e5bc63ae4a1d3894a5db737 --- /dev/null +++ b/params_shard_252.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd82343733056fb54bcd3c3a776bb8eae99922f2f1cf5f6403f88f5ecd2b755 +size 117440512 diff --git a/params_shard_253.bin b/params_shard_253.bin new file mode 100644 index 0000000000000000000000000000000000000000..86531ac946bace4ae4548732028326bbbaca7114 --- /dev/null +++ b/params_shard_253.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:266dd980536c6396276ed2ee5b7be427d4e3634f7d41564ddc7aae62f53cec85 +size 234881024 diff --git a/params_shard_254.bin b/params_shard_254.bin new file mode 100644 index 0000000000000000000000000000000000000000..659af2bcec2a8f3bec59af7a19f578e5e77f2091 --- /dev/null +++ b/params_shard_254.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f856e5148ae4a2180af0261933f9e5857001da9a3982904d42010f9c0c50f47f +size 26804224 diff --git a/params_shard_255.bin b/params_shard_255.bin new file mode 100644 index 0000000000000000000000000000000000000000..4cde8813c63473cc85c4c11403052708aadd951f --- /dev/null +++ b/params_shard_255.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ebdc8ff35aa8e7b75877e43d358e46426a4befe7b8f3905524f4bf71c94898f +size 41943040 diff --git a/params_shard_256.bin b/params_shard_256.bin new file mode 100644 index 0000000000000000000000000000000000000000..27e21be96bd1b2870730760637da3d487b2d6023 --- /dev/null +++ b/params_shard_256.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c2ccadb16b941a36f1c5e6ce7dd5bff13ab2dcdfd48b1145aaf083c9b9bb722 +size 33554432 diff --git a/params_shard_257.bin b/params_shard_257.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c85f8d61f76dc2d42f159e73ab78153668f1769 --- /dev/null +++ b/params_shard_257.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c785fab2c97ede3295da1e5b56afb9bdf597298ef699d43668edc6f50b9e6f +size 117440512 diff --git a/params_shard_258.bin b/params_shard_258.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c138bbf34f037ca1e702bb7d9f3a99a46f40914 --- /dev/null +++ b/params_shard_258.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55bbc128334f73635ef9b2d4df38a77dc717a0ab63fbb7b0e89c0c6434753eda +size 234881024 diff --git a/params_shard_259.bin b/params_shard_259.bin new file mode 100644 index 0000000000000000000000000000000000000000..a776d0546765e6870a4a21d36b91fbc66b35ded1 --- /dev/null +++ b/params_shard_259.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfb573874289d4e3d2056ede40e2566fc6515ccd241dcb6f03160e5c3497f66 +size 41943040 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..6be088425d2e8d566a91164124477426ae41a412 --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbeec9bfc2eb8a56ba8ce7fdf1f9f6fe10a8b940777ae757c2e859537dc6ada7 +size 33554432 diff --git a/params_shard_260.bin b/params_shard_260.bin new file mode 100644 index 0000000000000000000000000000000000000000..58885ec6bebf51e9eaa2aef315feb72960f8a0ba --- /dev/null +++ b/params_shard_260.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efd37163b36fc5ee1b62b2ef2797309d47f09204b641ff5cadd06d3fcd82be2b +size 33554432 diff --git a/params_shard_261.bin b/params_shard_261.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a201131e204872a1214f15a8e4876925752db2c --- /dev/null +++ b/params_shard_261.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ac4bbb7699ebea702f622d77eb533c513262a94b2637d39cf2fbef68451e98a +size 41943040 diff --git a/params_shard_262.bin b/params_shard_262.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8202136e365d9fd7273882a8109003a7044b3fb --- /dev/null +++ b/params_shard_262.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4d5ceb6cde3778b1302ac296374eac6579cda4d9ecfb7d2c92991559f9e7c0a +size 33554432 diff --git a/params_shard_263.bin b/params_shard_263.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f78113433d5b9e0b03b1cff58659941ec146b57 --- /dev/null +++ b/params_shard_263.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b60e34fba6f9ed3871056b294bda5eb249188d9126c9532b99c32cccf741b2a4 +size 117440512 diff --git a/params_shard_264.bin b/params_shard_264.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa2e6a526c0ffc3179d28622b094d7ce5d0c2995 --- /dev/null +++ b/params_shard_264.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3baeb303769ae12a9a0264e320558f9bdbe60ca3c723b94a6709118d18da1eed +size 234881024 diff --git a/params_shard_265.bin b/params_shard_265.bin new file mode 100644 index 0000000000000000000000000000000000000000..f226a34359bf07ce30198e625b3132b686cfb57c --- /dev/null +++ b/params_shard_265.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d19f0f09c050a730a5e25b7a8aa4b50998b483e77bae9946dae564a39ef358f5 +size 29163520 diff --git a/params_shard_266.bin b/params_shard_266.bin new file mode 100644 index 0000000000000000000000000000000000000000..80676e415420cbe085f1f5ad9e89b4559e95332b --- /dev/null +++ b/params_shard_266.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5ca2f71f75139fe6ab124b65b43fbc21edcd8120323d98ad65cd1c15541eeac +size 117440512 diff --git a/params_shard_267.bin b/params_shard_267.bin new file mode 100644 index 0000000000000000000000000000000000000000..64aa8c8561c9120b88e07b50cd1b4132af1b92f0 --- /dev/null +++ b/params_shard_267.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fc40b11d1ce63681307beaeabbee97aa87393224d73e5c97840d131d7f729b7 +size 234881024 diff --git a/params_shard_268.bin b/params_shard_268.bin new file mode 100644 index 0000000000000000000000000000000000000000..7ec69b16dfd52ca26aa3d9cb377f5ad806a27ea8 --- /dev/null +++ b/params_shard_268.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e498a9117f06834046e933440baf4ca033dc1e77cdff71eb26b3faed2329f0c +size 41943040 diff --git a/params_shard_269.bin b/params_shard_269.bin new file mode 100644 index 0000000000000000000000000000000000000000..d53b54366cfc3e9307ada8133f5b881134a7b5b3 --- /dev/null +++ b/params_shard_269.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4e98177bd2a696c2e2892a10daea3e35d8c663b24d12d4efac3b5f9ab62d4f +size 33554432 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..770554800b53c92952494b9605e647662aedfedd --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45548b1909378689960058ccb9b8c553bf210d22eb579c85be10815bac4d4af4 +size 41943040 diff --git a/params_shard_270.bin b/params_shard_270.bin new file mode 100644 index 0000000000000000000000000000000000000000..3804609bb285de81f093d16156e197926a1abf54 --- /dev/null +++ b/params_shard_270.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b2afebe10a1152994fbb5a3da7e105e2679e0c5248d76727a07e44c71d93b40 +size 117440512 diff --git a/params_shard_271.bin b/params_shard_271.bin new file mode 100644 index 0000000000000000000000000000000000000000..3af72edebcf8ca710941897fe983ac1ed57229e6 --- /dev/null +++ b/params_shard_271.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffeaccadb46c8ccd23bd611bf01b23ba0654c4d4c49af693effdb497b1c001a7 +size 234881024 diff --git a/params_shard_272.bin b/params_shard_272.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2601844ff0adb83d2aff4aec1802abaaef10c1f --- /dev/null +++ b/params_shard_272.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:850cc56b2b6c7b8cf7927ed8fa3a5bfc853d775b1d6b8e49d893c4478e027796 +size 41943040 diff --git a/params_shard_273.bin b/params_shard_273.bin new file mode 100644 index 0000000000000000000000000000000000000000..7f7880beedd3221b4399c9d4f3a0ccc96eb094fc --- /dev/null +++ b/params_shard_273.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5e301df6be73f8be4cfb11257aa9aafef647a02f19b00bd0dd94b5c4b7ca969 +size 33554432 diff --git a/params_shard_274.bin b/params_shard_274.bin new file mode 100644 index 0000000000000000000000000000000000000000..e1652d02ca263b06a7043d037093f3ea4a665809 --- /dev/null +++ b/params_shard_274.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3abfe392424aca2fb800bcc43a79d75b65a4cf79759c9978d1e651aa8a20ff8 +size 33112064 diff --git a/params_shard_275.bin b/params_shard_275.bin new file mode 100644 index 0000000000000000000000000000000000000000..dae4dc3c9796f89d71f5a25b65d73a5ad98bf0b4 --- /dev/null +++ b/params_shard_275.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:494dc47b14fdc186dafdf5357ee6c64da9edcd014839e3f76827037195f548e5 +size 41943040 diff --git a/params_shard_276.bin b/params_shard_276.bin new file mode 100644 index 0000000000000000000000000000000000000000..88917fa10d4e9fc40cc5a7274c51187d32f4f991 --- /dev/null +++ b/params_shard_276.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eca557325f34e3ebb424d5497c952f0238479b468b4b8d97ea039aa2af2a984 +size 117440512 diff --git a/params_shard_277.bin b/params_shard_277.bin new file mode 100644 index 0000000000000000000000000000000000000000..7dd05dcd15b862e9f7d37ac3e8431713daebdc3d --- /dev/null +++ b/params_shard_277.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44d3b7aa182295e329f68e08b388727253f6dbd565d7d41e4b02f410e76e5949 +size 234881024 diff --git a/params_shard_278.bin b/params_shard_278.bin new file mode 100644 index 0000000000000000000000000000000000000000..b47d25a84b09e170c62da84405dc50404e9b4976 --- /dev/null +++ b/params_shard_278.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1228c196e189ca5857b4c894381b27936785fc8c82681b7b661e249ed13376f +size 33554432 diff --git a/params_shard_279.bin b/params_shard_279.bin new file mode 100644 index 0000000000000000000000000000000000000000..16b74dcbc209a97a68e686c8e593b14f78541f79 --- /dev/null +++ b/params_shard_279.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ed41034a679d0bd72276231be473b1df63e3a32bb0a5e08df7f814f862637d +size 117440512 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..983ab727642fd575f4ef4ac46c281ef7dae901ef --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8310357eaca46ff079897fac98751b046e39cd6f0ee055b3d79000efe699f1a6 +size 33554432 diff --git a/params_shard_280.bin b/params_shard_280.bin new file mode 100644 index 0000000000000000000000000000000000000000..67c29fe1ed0ba648514577141dfd94494d1d11ee --- /dev/null +++ b/params_shard_280.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3779f31d73229786e3847ad304439d18f2bffc06b6fbfeaa30ed83b07b7c7de +size 234881024 diff --git a/params_shard_281.bin b/params_shard_281.bin new file mode 100644 index 0000000000000000000000000000000000000000..9cc6c5e4dbf91a7586bc50603b70964f6cd114aa --- /dev/null +++ b/params_shard_281.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09cc6753c59c58a0e3afc25fc2913b6a4c6f2313ff7045014b58859fd05e924b +size 41943040 diff --git a/params_shard_282.bin b/params_shard_282.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad3b1db85ef75c8ae66620e4d1af203a482dbc88 --- /dev/null +++ b/params_shard_282.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7780090be608d2328730e7276a9ca3d7abbc638072c3878eecdfbf91f4f6e9f +size 33554432 diff --git a/params_shard_283.bin b/params_shard_283.bin new file mode 100644 index 0000000000000000000000000000000000000000..47d314a3addfca6f962554ee3b0f568317331ec5 --- /dev/null +++ b/params_shard_283.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39015cf78b951b20f0619eae296b434fd578a5ef863d4efdc5ca70fb81f43f19 +size 117440512 diff --git a/params_shard_284.bin b/params_shard_284.bin new file mode 100644 index 0000000000000000000000000000000000000000..dbdcc40254bbebc0d92a028b7811803414ad25ee --- /dev/null +++ b/params_shard_284.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf124e03ea02e78c3dafb678d6c5dac196c2f1820eca09bfb2fbd6c2196087ab +size 234881024 diff --git a/params_shard_285.bin b/params_shard_285.bin new file mode 100644 index 0000000000000000000000000000000000000000..998d78b12cb215dfdfb89fe653868e55017e2d1c --- /dev/null +++ b/params_shard_285.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6250ae935071654a77131132b1b9ffd46fa7919fcf53282b379267623021bb64 +size 31522816 diff --git a/params_shard_286.bin b/params_shard_286.bin new file mode 100644 index 0000000000000000000000000000000000000000..45ba22707808d2334039bfe20c3433d739f3efca --- /dev/null +++ b/params_shard_286.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d611a043f63beb75b792f7d701969c609d81a6dde57f886752badec18a1e0279 +size 41943040 diff --git a/params_shard_287.bin b/params_shard_287.bin new file mode 100644 index 0000000000000000000000000000000000000000..441e559abc79762ead19aef14bdd79752f0de29b --- /dev/null +++ b/params_shard_287.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bac754510444fd6615041b2f953ffdd7a27360623e6cda69c1f6da7c153f8c1d +size 33554432 diff --git a/params_shard_288.bin b/params_shard_288.bin new file mode 100644 index 0000000000000000000000000000000000000000..df1715cc496a75b916950eca85d3ae4c21d95d37 --- /dev/null +++ b/params_shard_288.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d85be3e7fc6e687bcb5ed70f8820c15f105c6cfe3c3e8620923369813888fd02 +size 117440512 diff --git a/params_shard_289.bin b/params_shard_289.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e70dbc952fd13c0291062b34e2e13737f8ebc0b --- /dev/null +++ b/params_shard_289.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:174f7b7d6b8856551a4c55ab27ab123c90be66f8df2189759856a9a867bbfff7 +size 234881024 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..33d5850f37a98506145ec847c22edd6991baf92d --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db1e80b31f3dd2c8bfc2487cbdee48775a32d1298f7e0423db7fa07bc9c01e87 +size 117440512 diff --git a/params_shard_290.bin b/params_shard_290.bin new file mode 100644 index 0000000000000000000000000000000000000000..e38fac6b75155b60776a9914edbdba14c7c95919 --- /dev/null +++ b/params_shard_290.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe39d7c7ea7754f511740953c8629aaa275ddf1d460c0ad98e61645822402af8 +size 41943040 diff --git a/params_shard_291.bin b/params_shard_291.bin new file mode 100644 index 0000000000000000000000000000000000000000..31119679026cfe0949b3c1cd2321bb6c69c5d428 --- /dev/null +++ b/params_shard_291.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b5912936269fec55a8639d51d5d817ecd3addbf22dd34db320db8b8de97ab7 +size 33554432 diff --git a/params_shard_292.bin b/params_shard_292.bin new file mode 100644 index 0000000000000000000000000000000000000000..18530b18886ba5c58debe78eb83e69d718725f4b --- /dev/null +++ b/params_shard_292.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ffe7815fbdeaa246f224897fe98a102ca3b1eb44149daf4e63d7ab810d06e3 +size 117440512 diff --git a/params_shard_293.bin b/params_shard_293.bin new file mode 100644 index 0000000000000000000000000000000000000000..c04a40f55d7c2d27085311746b45ce4fc4afa139 --- /dev/null +++ b/params_shard_293.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf78034fcf1a4161b432e332a33fd28e56bc568b8beb4bf2f5167f623ee12cb +size 234881024 diff --git a/params_shard_294.bin b/params_shard_294.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0e99968bbf0f66566b6c883c4a7961e64cd3bdf --- /dev/null +++ b/params_shard_294.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9819de2ed435334d831c7286d4974582266986bba0744c16e2a4ea41794bd8fa +size 26820608 diff --git a/params_shard_295.bin b/params_shard_295.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a6cec8351a18a911ee0523bd6b7f3435ca7e458 --- /dev/null +++ b/params_shard_295.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa931f5075d3ae3a2c9ac045f633e3659f79346fb0a4aa83855929b304861be +size 41943040 diff --git a/params_shard_296.bin b/params_shard_296.bin new file mode 100644 index 0000000000000000000000000000000000000000..d3de4a3b3b25d0ded96dd3e27393cedf396134a8 --- /dev/null +++ b/params_shard_296.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b406a6358eb0e56411679ece7d3026c7f73b84f8ae11cde997420067075ca56 +size 33554432 diff --git a/params_shard_297.bin b/params_shard_297.bin new file mode 100644 index 0000000000000000000000000000000000000000..b32e8181565ddfe32075fe7d99906a192baab2b5 --- /dev/null +++ b/params_shard_297.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee4c09a8ab49216538d197f6358d321c9e301db2ff9c9a68ad97280b571502e8 +size 234881024 diff --git a/params_shard_298.bin b/params_shard_298.bin new file mode 100644 index 0000000000000000000000000000000000000000..357cdb231288e630e2524f28ae2280cda5fd4b6b --- /dev/null +++ b/params_shard_298.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:734516eb4eb5ede22fc9781de9028f773684cc21e25ec957a13f820c3144bbe5 +size 41943040 diff --git a/params_shard_299.bin b/params_shard_299.bin new file mode 100644 index 0000000000000000000000000000000000000000..943d749f8bc272102906147ef3a81e8ba9f17b18 --- /dev/null +++ b/params_shard_299.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:807c41750dd1a2c92bdb23b4649eb056b63f85057911a0b32324e0efb7f861bf +size 33554432 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..72114dbe094280cc2e366334c6238b342f0706da --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e21f24149e38222fa4041952650533a376326b91edd9d943ed1032a447ea70d2 +size 117440512 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..f6c9a49ca03d09e57a0ae5b6da366dd05f98da5f --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb56950d2b52526f2a9afb4e02527cf303887c24e4348387061c4edc1031f9dd +size 234881024 diff --git a/params_shard_300.bin b/params_shard_300.bin new file mode 100644 index 0000000000000000000000000000000000000000..48f2f6c294d5bb849912c619017bb9ce855a6bae --- /dev/null +++ b/params_shard_300.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0416b7b117f9200ff4ddd15f2cdab2375e39362fac0478d1c924d1cd2064b679 +size 117440512 diff --git a/params_shard_301.bin b/params_shard_301.bin new file mode 100644 index 0000000000000000000000000000000000000000..34a02650d060b10eb1e288186af488c9c6f35fae --- /dev/null +++ b/params_shard_301.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f78ae5e645660ebc5842d1c187a371545cff273f975521c2ce0b31a3426cb445 +size 117440512 diff --git a/params_shard_302.bin b/params_shard_302.bin new file mode 100644 index 0000000000000000000000000000000000000000..dff8b03c37928af8d04618034810fca78d9e6529 --- /dev/null +++ b/params_shard_302.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:617e5a8a2b43da6851873be9fd7ae29f0a3ec360169299da5274e7d7a665b157 +size 234881024 diff --git a/params_shard_303.bin b/params_shard_303.bin new file mode 100644 index 0000000000000000000000000000000000000000..9a987026ccdbdc84e6fb6fdab016b8237b2f37b7 --- /dev/null +++ b/params_shard_303.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2827703f2da5286c22c2477daddb3d9282964433240b37a07f5b4c1e7eb66c1e +size 26804224 diff --git a/params_shard_304.bin b/params_shard_304.bin new file mode 100644 index 0000000000000000000000000000000000000000..02c759f9a072fa6eeb7a0dede4b4f19aae0b5235 --- /dev/null +++ b/params_shard_304.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac97cbcd6d2edcf1556db4792195c4989ba44a66b94b45798215dbd69e4984c3 +size 41943040 diff --git a/params_shard_305.bin b/params_shard_305.bin new file mode 100644 index 0000000000000000000000000000000000000000..b03f59518a9c80aee48a21dfb954c39f301179f6 --- /dev/null +++ b/params_shard_305.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9901f4237b78cd6f5a3ee6673c787bd10df7c90105eafbd3081b12516970cc4 +size 33554432 diff --git a/params_shard_306.bin b/params_shard_306.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7a6a51a6dd014da2c26fe28e13fd1be28418250 --- /dev/null +++ b/params_shard_306.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f97fb64f9c871e7372681d35fa39597049b9d1b5ae1a282cc5ad9a2b2591db1 +size 117440512 diff --git a/params_shard_307.bin b/params_shard_307.bin new file mode 100644 index 0000000000000000000000000000000000000000..3f72cb0ba8a1e27e4ff2c58da283995975b85ba9 --- /dev/null +++ b/params_shard_307.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:299ac728e8643eca5c39913abd4cb5bc01ccb0e86d30d82d4a39325a744e60cb +size 234881024 diff --git a/params_shard_308.bin b/params_shard_308.bin new file mode 100644 index 0000000000000000000000000000000000000000..91d2ea9e83adec959f02c51124cf02556795b4b4 --- /dev/null +++ b/params_shard_308.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68f4df7a3f517913f243de38e364dfc5fa5fdd8cb764a5992cff25f8d6d66a83 +size 41943040 diff --git a/params_shard_309.bin b/params_shard_309.bin new file mode 100644 index 0000000000000000000000000000000000000000..f1e9152f4e7b90bbfcac3be2abdf69610b12696b --- /dev/null +++ b/params_shard_309.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c6fb1fd3278fef68aba3c87a760996df3afae86542e19771bf556392de2d5af +size 33554432 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..0dd051006e17f7af6332e1f9811dffe465cb9139 --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42cbf2325b6c6cadabcf36404042149c49f1801318077882fd07f5282246ed4a +size 29163520 diff --git a/params_shard_310.bin b/params_shard_310.bin new file mode 100644 index 0000000000000000000000000000000000000000..5def10b0ca40632ebb0b473e8eedbfd2a03a149f --- /dev/null +++ b/params_shard_310.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a41a6814efcb273c829ca2561c192050b229b6ba49fb0e7750809377b7a26622 +size 41943040 diff --git a/params_shard_311.bin b/params_shard_311.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8316239e598b542482a37605f34e29083d76c64 --- /dev/null +++ b/params_shard_311.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7104c2e372543c0f057ebf8ef2b11d8a0607ee39cb26851ed5987338a719f78b +size 33554432 diff --git a/params_shard_312.bin b/params_shard_312.bin new file mode 100644 index 0000000000000000000000000000000000000000..a207bdaf9b6774fce70a61350e3d52681f769574 --- /dev/null +++ b/params_shard_312.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2278e8926983ea88f105c569d22d829fed04685adfe2683f33eefcfb12f8bb00 +size 117440512 diff --git a/params_shard_313.bin b/params_shard_313.bin new file mode 100644 index 0000000000000000000000000000000000000000..4c1ff93cac9accd78198b1489d81bf735b8c1a1c --- /dev/null +++ b/params_shard_313.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:908b2b7acf49a98319e60c2c8882cf3b676700f7f40489651b38df065aa242ac +size 234881024 diff --git a/params_shard_314.bin b/params_shard_314.bin new file mode 100644 index 0000000000000000000000000000000000000000..cee46b9a573eb223a908ef7aa4c6651038c81e2c --- /dev/null +++ b/params_shard_314.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c11b7b450fa9cb7400560c608a0e46f2a1373909ca808c043d45baf60db8c56 +size 29163520 diff --git a/params_shard_315.bin b/params_shard_315.bin new file mode 100644 index 0000000000000000000000000000000000000000..b37f54a8ade08954c0e43cab20579ee78ddb38ad --- /dev/null +++ b/params_shard_315.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b725626a9af2644ac52a48101eb10e7c9e460f4401e1005ce7f2f2494b3671d9 +size 33554432 diff --git a/params_shard_316.bin b/params_shard_316.bin new file mode 100644 index 0000000000000000000000000000000000000000..9fcfe857631abf1a524f16ba363f2d22736c8f08 --- /dev/null +++ b/params_shard_316.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6087eeaf25d9ce98ffd3774a64cffc59a404f47d930a2c4a9898a62f83dc25a4 +size 117440512 diff --git a/params_shard_317.bin b/params_shard_317.bin new file mode 100644 index 0000000000000000000000000000000000000000..f5147f9fd2bfbf819bd98edf7175bf46a0e4cc29 --- /dev/null +++ b/params_shard_317.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e45c221f9fce5842dd1c98f946654e53ce7db0b43574efff7af671b7f6ffec4 +size 234881024 diff --git a/params_shard_318.bin b/params_shard_318.bin new file mode 100644 index 0000000000000000000000000000000000000000..549de6cbfb678a9056eaed3130048bb3fbcee126 --- /dev/null +++ b/params_shard_318.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc99a61a6518142f90561098ee80d7db273e21d8d256ca0cbd95f36e3142d1e0 +size 41943040 diff --git a/params_shard_319.bin b/params_shard_319.bin new file mode 100644 index 0000000000000000000000000000000000000000..7227125bacae97a2777be71ce0a7f201169f1060 --- /dev/null +++ b/params_shard_319.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4330da5e95c5778fad7ec0c89d2532566301f690c138ca1c048b0338c8e08c38 +size 33554432 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..5399ffbf8eaac255889fe743fa888ddd1fe42489 --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eae45ae09ab384fe32e0d6f1bfc84a942015d87e3575ebf45781316768ed23d +size 41943040 diff --git a/params_shard_320.bin b/params_shard_320.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8a5bc905f838cb55775a0025bf1e1ad6a8de7f3 --- /dev/null +++ b/params_shard_320.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3dc1fa8d7818a0735060885ace5d79ad5d0ce70b4287684df94db4f987e46c4 +size 117440512 diff --git a/params_shard_321.bin b/params_shard_321.bin new file mode 100644 index 0000000000000000000000000000000000000000..b005b89b2c41efeae8c20ed43e8f0a7c207c9884 --- /dev/null +++ b/params_shard_321.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:752250fc2dde0de26f5a5e166dc616b8977d1406318a412b693333cb5c9b8b5b +size 41943040 diff --git a/params_shard_322.bin b/params_shard_322.bin new file mode 100644 index 0000000000000000000000000000000000000000..6140a7446e7e1254c47b6c4498be0d81a528bc83 --- /dev/null +++ b/params_shard_322.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b9b7c6fe7914273af2c2ff234134faa4b117074988693790c00f5cd9ae21740 +size 33554432 diff --git a/params_shard_323.bin b/params_shard_323.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab853125e31fc10a215aeaa273dd4d31066ae825 --- /dev/null +++ b/params_shard_323.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fceb0c68b44912207516f60e45faf35bd3e80bf0df9d7a2ab4f98da0498b1b43 +size 117440512 diff --git a/params_shard_324.bin b/params_shard_324.bin new file mode 100644 index 0000000000000000000000000000000000000000..b9af3ae3d57b8abb40ac5a04550e5131b7587b67 --- /dev/null +++ b/params_shard_324.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a18feaa98efca939fc9df5d4613bf885ef37831784d8fd5ddb0a8bec792f62a0 +size 234881024 diff --git a/params_shard_325.bin b/params_shard_325.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a10ea69f40f75bdde5ce1ecb4d9ae4de73114d4 --- /dev/null +++ b/params_shard_325.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da55da5cda4b2bcc98bd011ad1fbb60ef830a2877d4a4f5ed759a5a21eb10f85 +size 31522816 diff --git a/params_shard_326.bin b/params_shard_326.bin new file mode 100644 index 0000000000000000000000000000000000000000..a543345de382d0523c9e7a41bb36b7803735c7d5 --- /dev/null +++ b/params_shard_326.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcb572630a2159ba048ddbe1429bea27dae9285cb9650c73a4965255515041b6 +size 117440512 diff --git a/params_shard_327.bin b/params_shard_327.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0cb61030a931d2abb2a75989d904e526e614856 --- /dev/null +++ b/params_shard_327.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79fb9dde16ed309a59ff7967b0da5a28e17e180941cf0d2a4bd3f877315dd7da +size 234881024 diff --git a/params_shard_328.bin b/params_shard_328.bin new file mode 100644 index 0000000000000000000000000000000000000000..37b166332dea719ae31c1dfaf5e642607511eeb4 --- /dev/null +++ b/params_shard_328.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b4e0eb741a1f119ef3d33610c68028a25625348b48bcd9befccea0f41edcb3 +size 41943040 diff --git a/params_shard_329.bin b/params_shard_329.bin new file mode 100644 index 0000000000000000000000000000000000000000..f92554a3a1953f1b7c54a6389929c328ad943f07 --- /dev/null +++ b/params_shard_329.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1a48b10321131f5c924caccdc8c9b45d9b48d4efd618ba41f918dba86be2780 +size 33554432 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..7971ddf30a49092c7ec8e62742eeb564cfe3be40 --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ba77cf13c62d3df92666e8d745f0ccecc2c2d708b291176640ef47dc4e31b50 +size 33554432 diff --git a/params_shard_330.bin b/params_shard_330.bin new file mode 100644 index 0000000000000000000000000000000000000000..9de1cfcad507469f24c70f761c472a7ccb62c194 --- /dev/null +++ b/params_shard_330.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5aa5fddccc2c734b0af8656c5ca47926738f4f4991071440d92c1075eef593a +size 117440512 diff --git a/params_shard_331.bin b/params_shard_331.bin new file mode 100644 index 0000000000000000000000000000000000000000..1bb2bd267d16b152674d313f7de7a3a80ca6d688 --- /dev/null +++ b/params_shard_331.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f58e1c0da36c03941cc7903a6cce13c3c47651811d9e0cee7b5aadf199fec18b +size 234881024 diff --git a/params_shard_332.bin b/params_shard_332.bin new file mode 100644 index 0000000000000000000000000000000000000000..9974b72e663c3fe923d167a01f6812b7904fb0c6 --- /dev/null +++ b/params_shard_332.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9abc90a1b36ecb94d0897081745a8618c9c9a6be6d0d22a6af0bf9f8da9f8b31 +size 41943040 diff --git a/params_shard_333.bin b/params_shard_333.bin new file mode 100644 index 0000000000000000000000000000000000000000..471e18c67c9b476d92ea281326fd36ef93c24b98 --- /dev/null +++ b/params_shard_333.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:442c1bb1226709b9966fc211054df221fd992879b103e87925c560705cd77929 +size 33554432 diff --git a/params_shard_334.bin b/params_shard_334.bin new file mode 100644 index 0000000000000000000000000000000000000000..1b92205f154bd69675e06a70a75fd9b9d88bf951 --- /dev/null +++ b/params_shard_334.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e038c0fd540e5cccb0a021a9ba3acf8d033d87787adf408420c7cdb3e002f3 +size 33112064 diff --git a/params_shard_335.bin b/params_shard_335.bin new file mode 100644 index 0000000000000000000000000000000000000000..83930f3ff2061707e62a1aa63b46d5f4612ec9a7 --- /dev/null +++ b/params_shard_335.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b916161a96dffdcc9d66cbcb66f5a17e7d2206ba363bc9d10abf29eee7198cfc +size 41943040 diff --git a/params_shard_336.bin b/params_shard_336.bin new file mode 100644 index 0000000000000000000000000000000000000000..e997ff4f098b9d4f33fd3ac50dd190fb3fca995c --- /dev/null +++ b/params_shard_336.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ee7c645dd2237e28909b411dc70aa6524ecda66b08f15fa1b6b283f74d8a0d +size 117440512 diff --git a/params_shard_337.bin b/params_shard_337.bin new file mode 100644 index 0000000000000000000000000000000000000000..17c20ba49f02ec4071d014d6655c4531392ef74b --- /dev/null +++ b/params_shard_337.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:857c668a56a7e8924aaa8bd6737a8be6d3d199a43de8da2f79281660243619ff +size 234881024 diff --git a/params_shard_338.bin b/params_shard_338.bin new file mode 100644 index 0000000000000000000000000000000000000000..8924617b73227f1b6cf1dc1686aa2602172a0655 --- /dev/null +++ b/params_shard_338.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a8eb393888450a3b0954cab1bf0d2793581422381b951415ca04dc3183e0c0 +size 33554432 diff --git a/params_shard_339.bin b/params_shard_339.bin new file mode 100644 index 0000000000000000000000000000000000000000..939dd9d6688a2d4c782b797af200f39682b077c4 --- /dev/null +++ b/params_shard_339.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb988d50e0380f1c99f7b47afb180e9b97be4d431702fc11be803e0284bdaae +size 117440512 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..5de1792cfbf458f6cb8d586a94256ce916371473 --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:340a8a8f33db3fc7078f8beeb24e96661cbeb11a87c41251e851f64f87808b18 +size 117440512 diff --git a/params_shard_340.bin b/params_shard_340.bin new file mode 100644 index 0000000000000000000000000000000000000000..9ccfe1232dcd183087286e492584333eff0a4217 --- /dev/null +++ b/params_shard_340.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a186724b3d5db21228bcd7ee33892d56237d028a54ce3949db2c7e75abe87a78 +size 234881024 diff --git a/params_shard_341.bin b/params_shard_341.bin new file mode 100644 index 0000000000000000000000000000000000000000..a4c457a7ae943a30dc731af4e3b535b81a2744b7 --- /dev/null +++ b/params_shard_341.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd49e4de2c051349c3c99a1dfbf09a67fdd0eee7763daf02e7c4d93b62d6c979 +size 41943040 diff --git a/params_shard_342.bin b/params_shard_342.bin new file mode 100644 index 0000000000000000000000000000000000000000..15d8d16fc41cfc13ca47de90771ccdb46541f462 --- /dev/null +++ b/params_shard_342.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f457b5457f045fdf0a1c0345f6e2adfbec1f2c27a6cf6863761b63caf2a261c6 +size 33554432 diff --git a/params_shard_343.bin b/params_shard_343.bin new file mode 100644 index 0000000000000000000000000000000000000000..39a7c7e6ec6f00081f7d6294ff25490a7c259e31 --- /dev/null +++ b/params_shard_343.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2fcc46ca64ca352b4d04c89fca02851a73dae896f50640ae7fd2ecdab5bf9a2 +size 117440512 diff --git a/params_shard_344.bin b/params_shard_344.bin new file mode 100644 index 0000000000000000000000000000000000000000..c00c62e97119e929dedf444357f9ce4c6b9f83a5 --- /dev/null +++ b/params_shard_344.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b9dad4e18b0b607272e680e0cc7587ca6d4c5b3cde986b79a0039a67d5b6ee +size 234881024 diff --git a/params_shard_345.bin b/params_shard_345.bin new file mode 100644 index 0000000000000000000000000000000000000000..ae871580fb4aeafab2003e602b05dfe7b32be4ef --- /dev/null +++ b/params_shard_345.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:149245d90530419d9fc12967bc6208e622cd542bf0cc22b48b0fcc66e0673c6a +size 31522816 diff --git a/params_shard_346.bin b/params_shard_346.bin new file mode 100644 index 0000000000000000000000000000000000000000..b0aca04df534f432df15f6866a31a520f258794e --- /dev/null +++ b/params_shard_346.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad6cf77514fada9afca0bc2ed4a18ea2be4a405f68db156512e3fbceaed73a01 +size 41943040 diff --git a/params_shard_347.bin b/params_shard_347.bin new file mode 100644 index 0000000000000000000000000000000000000000..00dd752e8c0b574faf5180f7802de1bf49218681 --- /dev/null +++ b/params_shard_347.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33ee98e1e054ecea7faeae8df202ede4e4e30819922c33d16c3679ce69402da7 +size 33554432 diff --git a/params_shard_348.bin b/params_shard_348.bin new file mode 100644 index 0000000000000000000000000000000000000000..24962a227f02589611575f0681ec84bab7899b5c --- /dev/null +++ b/params_shard_348.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:873e8fcb211f8e97992ce912b63b423d8420bbb5ca330cfd6681cba775ea420e +size 117440512 diff --git a/params_shard_349.bin b/params_shard_349.bin new file mode 100644 index 0000000000000000000000000000000000000000..4901f13df48ddd7d2730fe37be844a8f3d30c3c6 --- /dev/null +++ b/params_shard_349.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d33d666055e03faed825a011b71872b4d44c08de2d2bf1c406dcb3292bd77902 +size 234881024 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..a09ea5b79a118c8f7d6b2d9bcc80219ab1f426d6 --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca8b2bf3f60b0d984c33b97d2adc20f7586bb78956b11b7d7ecb08f53bf0ea7 +size 234881024 diff --git a/params_shard_350.bin b/params_shard_350.bin new file mode 100644 index 0000000000000000000000000000000000000000..b70cb469b523d683ed9e7848def84a19142e2375 --- /dev/null +++ b/params_shard_350.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f0dcd88b0c3641dafb6eef4e1eb684c00b877418aba4db14a5f78c4a15e58f2 +size 41943040 diff --git a/params_shard_351.bin b/params_shard_351.bin new file mode 100644 index 0000000000000000000000000000000000000000..97fd7ed73261fe866dd6f86c5cd462d7f4b22dd8 --- /dev/null +++ b/params_shard_351.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:704622292db2a255187f96675b0234683583de99b327bc3e5695f9ea5d958b2e +size 33554432 diff --git a/params_shard_352.bin b/params_shard_352.bin new file mode 100644 index 0000000000000000000000000000000000000000..c6cb8d287bd3bc7aa60094a2636728c2965fc954 --- /dev/null +++ b/params_shard_352.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:459315cc5ee9dc147079e47b556dba951e30ac854323c2a6f24b7290f5a87f8f +size 117440512 diff --git a/params_shard_353.bin b/params_shard_353.bin new file mode 100644 index 0000000000000000000000000000000000000000..c611270294a20aec15fdc45d0e393ca973df686f --- /dev/null +++ b/params_shard_353.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8ac1cb027fc281f5c6b93c0e60e290dc7278c92ecfd4a7679abd9e347a67555 +size 234881024 diff --git a/params_shard_354.bin b/params_shard_354.bin new file mode 100644 index 0000000000000000000000000000000000000000..a1172a714aa1f9f48779a8d5aa4a571f55ef9cb8 --- /dev/null +++ b/params_shard_354.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9f49fe2954be9420ccf2b1ec98a18910260178ed62d280840cd5588c478742f +size 26820608 diff --git a/params_shard_355.bin b/params_shard_355.bin new file mode 100644 index 0000000000000000000000000000000000000000..7318642d45c222fa209f25a4f210eb39da3337a7 --- /dev/null +++ b/params_shard_355.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd60c960271ba2cb950b1a951eb78affdc7bf173f9dbd2dd22e07fddc219d88 +size 41943040 diff --git a/params_shard_356.bin b/params_shard_356.bin new file mode 100644 index 0000000000000000000000000000000000000000..6d94028f920670633a0c4598cbdb52140d1d7c35 --- /dev/null +++ b/params_shard_356.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077e6e9f4f86c75e004b9304ed9d8befc4c06967b684fc7c51d1c009d3a70bd5 +size 33554432 diff --git a/params_shard_357.bin b/params_shard_357.bin new file mode 100644 index 0000000000000000000000000000000000000000..e2bb1d6e04a47f3758a0bf0182da8a240cb1c7b1 --- /dev/null +++ b/params_shard_357.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bcd886592f9626f4f2dcee49c86a16f036827703fc41eef8184333706e7d719 +size 41943040 diff --git a/params_shard_358.bin b/params_shard_358.bin new file mode 100644 index 0000000000000000000000000000000000000000..52672e1fa7ac0d11d5226509be0df6dafb299eac --- /dev/null +++ b/params_shard_358.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89e216d304830212d3360933af4dc97a86f60f68914f43f38e1a2273f45ba22f +size 33554432 diff --git a/params_shard_359.bin b/params_shard_359.bin new file mode 100644 index 0000000000000000000000000000000000000000..a805fbd00fd8b7c570af1f1fcf8dda2b39baffa9 --- /dev/null +++ b/params_shard_359.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d71db6edef17ed24d8eba304bb88f5e35d5ecc72ba689d01b4badf669d87b0e +size 12075008 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2a92201e5b3d0bdc5131125786358102bb36e07 --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e79803323039fa9e71a9036d2ef340fe91a2fabbd50a0b2f3a1371ce2e84d95 +size 41943040 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..d4899326975bc639039f8c34ea5733d5016a75c0 --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6baee5f92fd55b4afb91a9f72e34aeff6950e22eea79baedd9d1a412c5874724 +size 33554432 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee960947bbdce1813006c506316375b7a88d6476 --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:428ff9c13f92ecc215283ce903a6ee848d17b0ef568bf02f7053a4d3ebd4710d +size 234881024 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..35e36516c412c8bdd591d1874a9db74c3cca3dab --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfdddef0984a55e7af914cdfc5b7c119e380e93ae53f10feaaf27ad2d986d06 +size 41943040 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..5dced6f776033e2eb59975f2f215aaa324a98066 --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66557dfaf0607c8b46fe0957ae1c08c0939dffcb0cc92217211807cbee3bf0ff +size 234881024 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..56ea49d464e8c9111fb183567f71cebca0a28a14 --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe0a55a21db1f6e94ae2ebc0434daedf78c76314d5b1279577abba82db3db8ac +size 33554432 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..90dac0b4bb7d39055936c9881dca25b7f593dd36 --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c5f23cbb27738b5b22af01bdcd4faeacea282b7d79067d6e871b1e158fe9968 +size 234881024 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..3279ccb1442678e10ac82636fb3c303afd564570 --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a7bcf72cbf974fdce3d9b4a04cb1ed4a28e4045b03190a2da9840798cfc41fc +size 32833536 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..b48532f4cb869cd03969ebd4b9e3699bba600cb0 --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44a4166708b1647242b492e4e9cc8fdbbcf5f5c5e8c8842626f80acd2a1aad6 +size 117440512 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..9e4f2a5488aa1132413819c943d8a09d527f6967 --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7a439afd774c97be94522f802c5b0b17d6bc04a9e16da4a58be3f302f200d0 +size 117440512 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..b52d4b91e669da234add3486e98a8bd7b650d78b --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073da908388edc86aa7f10842bb24ccd6e3898ff7c59cab2ed36f2c72d9595eb +size 234881024 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3d540f9e97f7b9c7eb4616f466d80df6fddbc09 --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8467c4b2f085cd7b0bb34c81f3723d9bdd1b99c5106a318e4c7d7ab5b84fc9a +size 41943040 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..92ceb6317206de0320da2249a4cb6365c5d079b0 --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbc8f78b215af4f053f80534b3f5cb4beeb47ac6701517b4ae3f5e4d314f73e7 +size 33554432 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..899b5dbe862dc48a97dba306c5d7f7c2deb46fa2 --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ee33ddbc1e36aa18bb261ad53b44b10ead4c5d89d8034119f6e68c57e91df38 +size 117440512 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..0155a6a6d2b8bf9706f7331a0303eb71ef475239 --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd05f65bb828bff920aac3c66df3af3e10d1e26795c728e85e14d49ef7e3f8dc +size 234881024 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..294b510c4b4eed7ae9592323e7110fdb2b7660b1 --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bd5eddbb39054924d5fcbf5a40aed872b9b16c4d305d4bfca25fea0382da9c4 +size 31145984 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..93f4f37df802d54ef5d7befa8b5ee9a2762e2c01 --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2300fd0f979c179aa63d3233beaab929f53b6e43b609d3359a9300292ebcd10 +size 28147712 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb84dee41b42c6338b171480cfbfbab2d67a6b4d --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84985e8b2815da6e0d14d71667017eccf0fb1070a131754fa5828a85e10fe64c +size 41943040 diff --git a/params_shard_52.bin b/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..96df7521f3950dcc42e9592f9d233d92ccf5d19b --- /dev/null +++ b/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41bd3322e7d55e3c1caab56907bd3cb3433f348af46002bead075d587c4b280b +size 33554432 diff --git a/params_shard_53.bin b/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..eee331ac1bbf3c078a47d0976519d236be4f22f7 --- /dev/null +++ b/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:972fba8b333da7f9edc7737729b8054da1a69fa9b6c819e5e72d0ac512e83397 +size 41943040 diff --git a/params_shard_54.bin b/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..c68930aae8cc377aa8edeb9560b4c727a3a713b5 --- /dev/null +++ b/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e51facad677003654d05477335f7dbf41d5a9b9410fd70450f0d1217089fbeb1 +size 33554432 diff --git a/params_shard_55.bin b/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..63390a373e03c46e131712fd57367f9fcb0b79a5 --- /dev/null +++ b/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc8d6be3da8e615e626a5ab3bef85215df4d2103c2b8477a25eda3d5b4abb95 +size 117440512 diff --git a/params_shard_56.bin b/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..31595af2dad46b5bcec609dea516710439558cf7 --- /dev/null +++ b/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:069417eb5482e3bc34e67fcf60893eefd7ddf4f22806c3cedd9ccb3b4ddc2045 +size 234881024 diff --git a/params_shard_57.bin b/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..e43381a3998e442afc4244bca0f321520298dc2f --- /dev/null +++ b/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:887e911c3ff08b10a8a08834b0a424a5a702cc0aa9b24ea3c994a8dcb9dcaa77 +size 117440512 diff --git a/params_shard_58.bin b/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..f1b85d03cb89d62870ccf58bd03a48687016dcf1 --- /dev/null +++ b/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50f8ffb509c349487964a8127116b183d784454ffa2d6a6b984ea3efe66ca7df +size 234881024 diff --git a/params_shard_59.bin b/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..46f71464fb6d7bbde8f1035cc2d1fd6dc091856e --- /dev/null +++ b/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d45c76836eb296a55e7b2c2f881c4ac4aa2c8feda439ceb540d56f32264c4e +size 26804224 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..f4fdd0eb33559b41a299948cf6ca4d8ee2cd835b --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ddaf6a5ab7af7fb2d81ab563830062dae03252409f4701d433a65f1285e85b +size 41943040 diff --git a/params_shard_60.bin b/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..75d3f5e452b0be4ae55e1947dd895f1590dc3d47 --- /dev/null +++ b/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b490f1cafb971a2fe82e587ab057a4df6e2a44ca0ef6b6474803eec218cd2992 +size 41943040 diff --git a/params_shard_61.bin b/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..ebad44c4c0f679d65b0960faf85108b599a580ca --- /dev/null +++ b/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917cfce9919c9429002dd730f7c3bb796e26a8a82e5d71eddbc92dce540ea387 +size 33554432 diff --git a/params_shard_62.bin b/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..bb2019112fb7a05288a249a2bf0d9257d01c7dbf --- /dev/null +++ b/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9285caa19ffded2d50388ff1eb3fbf80a2b67f138a49853b2c548e3920f58e5 +size 117440512 diff --git a/params_shard_63.bin b/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..df355491a4bfc656e76a503aa59cb7dfef08298c --- /dev/null +++ b/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6433ed3b88da678c097dfb1c1a1624ccbfcca5b790b90ab3467d3bc77b92e57 +size 234881024 diff --git a/params_shard_64.bin b/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd6457cd3285558e2a7aec0350fa4e4d90e3ca02 --- /dev/null +++ b/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e14a1a707b3ffa0a08aba5a34978d512db7f9142b51ed8758023510691ea73b +size 41943040 diff --git a/params_shard_65.bin b/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..ddc6ea670a76594c580739f152617145b7e48967 --- /dev/null +++ b/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e908941335e38688906641188f252e6d9f5bf583370e516f6dc12a301c885b0 +size 33554432 diff --git a/params_shard_66.bin b/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..6bd28728f0177bb03634f2a92a60150960f175e9 --- /dev/null +++ b/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3646e02bd5d8ba256f7fcb29921908e00f3905cde737c3fe34330db63ed485e5 +size 41943040 diff --git a/params_shard_67.bin b/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8d6a1363b65576efa76c45ea7ef5993c0001dfe --- /dev/null +++ b/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2d35d33c1f8eba5abc1f468522cc99411c43f62b5565df826e4aa7a2909e9a3 +size 117440512 diff --git a/params_shard_68.bin b/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..94c44a968a47a2f98b380e71fff4c3b15a5d27a8 --- /dev/null +++ b/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d30a21aaf331f7f53a347988141f517855b63a69b292106d33b3331a6680dd8 +size 234881024 diff --git a/params_shard_69.bin b/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..abe160ddfc2221b75c05682440b3748717ecfe11 --- /dev/null +++ b/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0da229e502df8e8469c2a87105ff1f38fd1ac7d661beae580008a8a072c3b8 +size 28114944 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..c0f6f89005ed0a8ae52630b9605f2566b7d73a90 --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e619cf6d5f7d1d97e5a2582e955518e7c9279c0d2bf17354a8493d4cc3d4d9f +size 33554432 diff --git a/params_shard_70.bin b/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..7084287c9e587b42df41e1bbef2dbfd50ec5c20a --- /dev/null +++ b/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89065f971a457cd3127fbfd6dd806a6b26e73d3588e8c536254d5a1e917c9077 +size 33554432 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..293aacabfe67edd3f0ddb1378b9066c3845a8285 --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59501447be786b15e5464b1728b74b8710417a74a884c08db2aa7c56452631e6 +size 117440512 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..c750337ef9a4a3959b238d0738c3dcb72f040253 --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83edf023650ddb501948373e2d569bd48fabba6969e34966aeb2a4bfd268d0eb +size 234881024 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..92334550275cdf124244e86148357e6f6aa390ac --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78cb8d20a1a4b09e8da4b0e13902ef5602a1d84b34652c301fcdd33db04109f5 +size 41943040 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..f27fcce33d6d84e77fa43fafcef9e34b6c2c2f78 --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0572faad4a7d9f93099d91f1f0ec02c574f902d7921a9cef4f911297ab024405 +size 33554432 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..97737233564b329b487620782d32058a9627ace8 --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c59be8b11ee5b2b6d1bb45cbb49532a1c9534fded5a937f79b824738d5a4e93 +size 117440512 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..454b60eb1acd0d7c377ac36a494d35eb503240b5 --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b780c3665e67f078ded320491da5232e9cf46c695074dec1bb49a01e098c19cd +size 234881024 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..b98ef58462119e175a8adcf76e17021402eccff4 --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b96a9c7ef60975bdfd31710cf4adc481bf3d48d16bb72cb2de7e10d8e832f03 +size 41943040 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..11745b2dfff33bf31b77ecfc3275174e3c5baf3e --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e7292ab329585a210c8da0f53945282907997017fff3ce9f06494c9278e677 +size 32817152 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..a4ce58fe1306a02c07621dc852d5053fa72604e6 --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7185c3ad492acaaf4001d1176d8b0f21aa2419719ce3a266db71eb3fd59e1f01 +size 33554432 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..9fb0d4f51868cffe2ebe042288ca778a3bb6d655 --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d82a3a09ee36eb1f2fba480373bf3db398c61b12b202a0f46f5c953f970f5065 +size 525336576 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..aafcd77a548936a7927b02b83d47925308688829 --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dff1a9384a8b73886b01d295b9b2efd1f932b573718a7a1d3ced9edf41512a0d +size 117440512 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..835e421aeac21bde8842a4966caac07dce93148e --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:903d0eb54a37b06a76bb269530c91dd49f4c778dbf141f0e931391e2249389c3 +size 234881024 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..1229dfb07b852908f5d70a955daf85cd0ecb408c --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73639a5386593b875cba6bf66052e50888f479b03f4f38860241bb87cdef5f9b +size 41943040 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..11a74440ae6885fc796d25214d7514f73f76021b --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bac22a7d385d51e54a1eb595de2ec7344b8e6c98cb233f6f1398e31e1acc1a86 +size 33554432 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba4dc83adc4b5f96cf780f281ec2260807592cd7 --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b797f4f790b892e56d1a4341bf375a2f094639fd393af2cec6590d42d0e5de7 +size 117440512 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..c2be8e17b6d1b3249239818e6d4c9f5fc58f6545 --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:510a18ed1c0f208c52f521cb0676f3bedb08e258ae48aa3488d7fe920239968d +size 234881024 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..9a37d1122a776142e2eda09de19d204496d427ae --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:193ebe98d2d55d5b3b54077f3a524552d90b28959d9a2111a6df8492da5d8530 +size 41943040 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..5e05abe16ff8fa8bd9aba8f3291d2149cc8a8770 --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:562888100ff75d1852e6060af0eab9b27088e0c474298a561727da9cefd548af +size 33554432 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..0d23e9f64ff9264dbd5cba07cda6faf682123915 --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab8dfd8898ff1f067b6b931199e1a32990118b0e1420b5ce8920922479536297 +size 234881024 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..06d6e70a063c7f76a67859e22a0298e3c8efdf4a --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15704d4437b84efcf8147a16d74de467db81e397f48ad22cc40fba98645a9550 +size 29196288 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..f71a82de639b1433806e6541f852890cd3f3b48a --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43739f3c1a5139be26e579f9606203b5d04a84649eba3df105f8c7168baff734 +size 117440512 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..0edd7a7e997f28afc7a481e28893c036f8ba59f7 --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f0505a70d4257caf9d93bbd016a6cac8869056a3ecb8251a5154ca9b6bd5a2d +size 41943040 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..3d4c46e6329a1d037f2507fa90af78cf8097e038 --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b34a4059ade1f636846a6abd5b0c8baec6bf32ea151ff7b7b31cfd1a28f1ebe3 +size 33554432 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..09232c7c19325ad0bd0e0d743ad3193e97b56b18 --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:262d08b3ce73b938dff0676f1d74f440ba603fd404806989e29110bd2c5a8347 +size 117440512 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e511c8a9fd1bac7d9e3cfd8c9daafe289a47a43 --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a6aef94e3c5d6a80d964e537b8c37668b42c2fcddbe39d0fcdacb3ddf36d0c3 +size 117440512 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..dda3d10a5213deef5a09fc135de0b5f9757ef38e --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d18b0cfbe965a8c9a5cb2de609419ba32cf319079643d64cc3328d6aa0557bf +size 234881024 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d6f1d4585625cc4fe917bcc6234f16528e7bbe2 --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91848799ccbf5a55c54c93c12a9cd50d71ec11a6c3850d32aa47a0b9e219abb0 +size 41943040 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a2bc51fed8f92fc452ef1aeba7127544b4cb330 --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3349fbaba4bb8bdc33b3b2a4c1d2a0296e60b754fbb34003f6377e2dc203301 +size 33554432 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..85a787748101ca7b6d366cc38710f4b57029e14e --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f01952ddd637cbca2342757ad73936e1acdb9288fc6c40bfd1b35866851928ca +size 117440512 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..c8516a7c35ec1b30787a9fbf6622a5f98300d7d6 --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0de25d6a44479fdccadf163a4f1144b714303c8689925240f36a5279ecdda7e +size 234881024 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..f988287a698183901056e9517d720d6a1444007f --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1be13b677d4c0b8a9bf0f55a5bd15a15e4a4beb7adbfe60ce3ac4a6e797230ac +size 30490624 diff --git a/private-llm-config.json b/private-llm-config.json new file mode 100644 index 0000000000000000000000000000000000000000..0fdc034341d0b1f8ccb19ff6471c501e74f31fd4 --- /dev/null +++ b/private-llm-config.json @@ -0,0 +1,55 @@ +{ + "model_type": "llama", + "quantization": "w4a16g128sym", + "model_config": { + "hidden_size": 8192, + "intermediate_size": 28672, + "num_attention_heads": 64, + "num_hidden_layers": 80, + "rms_norm_eps": 1e-05, + "vocab_size": 128256, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "context_window_size": 4096, + "prefill_chunk_size": 128, + "num_key_value_heads": 8, + "head_dim": 128, + "tensor_parallel_shards": 1, + "pipeline_parallel_stages": 1, + "max_batch_size": 80 + }, + "vocab_size": 128256, + "context_window_size": 4096, + "sliding_window_size": -1, + "prefill_chunk_size": 128, + "attention_sink_size": -1, + "tensor_parallel_shards": 1, + "mean_gen_len": 128, + "max_gen_len": 512, + "shift_fill_factor": 0.3, + "temperature": 0.6, + "presence_penalty": 0.0, + "frequency_penalty": 0.0, + "repetition_penalty": 1.0, + "top_p": 0.9, + "conv_template": "llama-3", + "pad_token_id": 0, + "bos_token_id": 128000, + "eos_token_id": [ + 128001, + 128008, + 128009 + ], + "tokenizer_files": [ + "tokenizer.json", + "tokenizer_config.json" + ], + "version": "0.1.0" +} \ No newline at end of file diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1c1d8d5c9024994f1d3b00f9662b8dd89ca13cf2 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b +size 17209920 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..edb1acf65b93e6dd441a66eba58e669b7cf302ac --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2065 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|finetune_right_pad_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|python_tag|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128031": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128043": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128114": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128173": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128232": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "bos_token": "<|begin_of_text|>", + "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}", + "clean_up_tokenization_spaces": true, + "eos_token": "<|eot_id|>", + "extra_special_tokens": {}, + "legacy": false, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 131072, + "pad_token": "<|finetune_right_pad_id|>", + "tokenizer_class": "PreTrainedTokenizerFast" +}