diff --git a/mlc-chat-config.json b/mlc-chat-config.json
new file mode 100644
index 0000000000000000000000000000000000000000..d129b5e822b49c529d6ed1372a4a52680933f0ce
--- /dev/null
+++ b/mlc-chat-config.json
@@ -0,0 +1,87 @@
+{
+ "version": "0.1.0",
+ "model_type": "llama",
+ "quantization": "q4f16_1",
+ "model_config": {
+ "hidden_size": 8192,
+ "intermediate_size": 28672,
+ "num_attention_heads": 64,
+ "num_hidden_layers": 80,
+ "rms_norm_eps": 1e-05,
+ "vocab_size": 128256,
+ "tie_word_embeddings": false,
+ "position_embedding_base": 500000.0,
+ "rope_scaling": {
+ "factor": 8.0,
+ "high_freq_factor": 4.0,
+ "low_freq_factor": 1.0,
+ "original_max_position_embeddings": 8192,
+ "rope_type": "llama3"
+ },
+ "context_window_size": 131072,
+ "prefill_chunk_size": 8192,
+ "num_key_value_heads": 8,
+ "head_dim": 128,
+ "tensor_parallel_shards": 1,
+ "pipeline_parallel_stages": 1,
+ "max_batch_size": 128,
+ "disaggregation": false
+ },
+ "vocab_size": 128256,
+ "context_window_size": 131072,
+ "sliding_window_size": -1,
+ "prefill_chunk_size": 8192,
+ "attention_sink_size": -1,
+ "tensor_parallel_shards": 1,
+ "pipeline_parallel_stages": 1,
+ "temperature": 1.0,
+ "presence_penalty": 0.0,
+ "frequency_penalty": 0.0,
+ "repetition_penalty": 1.0,
+ "top_p": 1.0,
+ "tokenizer_files": [
+ "tokenizer.json",
+ "tokenizer_config.json"
+ ],
+ "tokenizer_info": {
+ "token_postproc_method": "byte_level",
+ "prepend_space_in_encode": false,
+ "strip_space_in_decode": false
+ },
+ "conv_template": {
+ "name": "deepseek_v3",
+ "system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
+ "system_message": "You are a helpful assistant.",
+ "system_prefix_token_ids": null,
+ "add_role_after_system_message": true,
+ "roles": {
+ "user": "<\uff5cUser\uff5c>",
+ "assistant": "<\uff5cAssistant\uff5c>"
+ },
+ "role_templates": {
+ "user": "{user_message}",
+ "assistant": "{assistant_message}",
+ "tool": "{tool_message}"
+ },
+ "messages": [],
+ "seps": [
+ "",
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
+ ],
+ "role_content_sep": "",
+ "role_empty_sep": "",
+ "stop_str": [],
+ "stop_token_ids": [
+ 128001
+ ],
+ "function_string": "",
+ "use_function_calling": false
+ },
+ "pad_token_id": 0,
+ "bos_token_id": 128000,
+ "eos_token_id": [
+ 128001,
+ 128008,
+ 128009
+ ]
+}
\ No newline at end of file
diff --git a/ndarray-cache.json b/ndarray-cache.json
new file mode 100644
index 0000000000000000000000000000000000000000..76c23843f7dae3f73ed9857e51278b63d3d14495
--- /dev/null
+++ b/ndarray-cache.json
@@ -0,0 +1,12575 @@
+{
+ "metadata": {
+ "ParamSize": 805,
+ "ParamBytes": 39688355840.0,
+ "BitsPerParam": 4.500214977904823
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 525336576,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_weight",
+ "shape": [
+ 128256,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 525336576,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6f5e74599227c40ab689174bb88c2800"
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 65667072,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_scale",
+ "shape": [
+ 128256,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 65667072,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "db99bc516623056f007ae98a3c75aa7b"
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f7a1783c591f23d770040417970dd701"
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "83d0fc4b0122de280f1bdd7f81d0d27f"
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cbfcbdbe8776e1fad546b00e6c14e849"
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1b1ded1aa9a3c68158ab490c93559850"
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1bc4223e36096eb1e951e429a5308025"
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fb802aefe3b565ca32a6c6c3923a8fb4"
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d9a999d22268fa98cb2585d9ac989da2"
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 29392896,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 5242880
+ },
+ {
+ "name": "model.layers.0.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 9437184
+ },
+ {
+ "name": "model.layers.0.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 24117248
+ },
+ {
+ "name": "model.layers.0.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 24133632
+ },
+ {
+ "name": "model.layers.1.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 24150016
+ }
+ ],
+ "md5sum": "9cd3789aa0c451a24ef2ce0305b04605"
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ebe6bef2e21ad1093e8ef53eb1e49553"
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b4b02c3ef1ade8dc6b7420ef9d1239b0"
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "11dd577951de782447324f5dab9f4ee9"
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bccf57a8801c76a43c8c8b6336b5e04a"
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b822be096d5f20825a7c2e0e2e188bb5"
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6f1ce602693d73fa5f92cbe7b417f4f0"
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4f46dca6d0a13181fbf3af081811e5d5"
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6982920d3e5378844011a456accb176f"
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 28344320,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.1.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 4194304
+ },
+ {
+ "name": "model.layers.1.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 18874368
+ },
+ {
+ "name": "model.layers.1.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 18890752
+ },
+ {
+ "name": "model.layers.2.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 18907136
+ },
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 24150016
+ }
+ ],
+ "md5sum": "40269c60231442ebd841abd3168afc1c"
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9338379683217c18f23745c10d54014d"
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "18155eb577269f746ecfaf1031f61fdc"
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "269a5b7ba6f3bd474edd3ff87c5f89b6"
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a7edad19d0a8c2283bfd095f18c628d2"
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6bafa7580f0650ef5edbdaf29ccf1ca2"
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.2.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.2.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.3.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "ee49814d64be0a111193659d3f228f95"
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5e590be2aa17281d22c11ec6e41e6f78"
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "36fcf268da4fadbda7c8b3cacd782dfc"
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "70b133837036cfbeac050a9836ea9773"
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7050f6351e279ab91d343e469c6a0503"
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8bb9e86e24f45e0294864f5a05d2a932"
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.3.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.3.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.4.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "eca8c413e82304f4d41e867216501af9"
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a7906018f796777c94de03e1235b0f94"
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6898759b6a1b1f85a9e508bcaaf68c80"
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "62d0a6ccec34c8780b1ee7f7eb314d03"
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "043726272d9ce733c9200eeba31ee0e8"
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a0676755ea49284b33b70929cc31e6fe"
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.4.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.4.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.5.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c2b42ed2efc1e9fe01334aa9b156948c"
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5d865ffbe521c767c62d2c36ad1f61dd"
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a9206e78d3f6c523a2b71512783d9441"
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4662e722826056fe45409389b60b4825"
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "109ccb0bdae2988e95b93dbe23f7e9a4"
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5d031e38b68b694d824b00b61fb4a634"
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.5.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.5.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.6.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "bd2a66faa2f7316fc55ab1689578b3d9"
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "660b66f50e7ee4b516343b04f750cc24"
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c0b051f1d778611d95eba6d8c01c3af0"
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c7bf795af5985484c06d9ad25f2c1a97"
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "678586bc757b0331520eacd2f8361ebf"
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0b9c672a2c2961504ecb6a03d8c856fb"
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.6.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.6.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.7.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "41dc499bf0377a0c27894bbf30e55573"
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "24656de65354137fb22ba600784afb9a"
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "14f7fa64ebf149cfd05a74d1449ebde1"
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "26f6225dc5776e8366a0b4b5499451c2"
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "96c1efec5ac67c683e87202de4266385"
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "42149964791fa82f30ea2cf2de9f37a9"
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.7.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.7.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.8.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "8e83ab28aa70ffcc548a5aafa3e67dd2"
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5f8c96536c97c2b00822e33534d9ae35"
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c52afabd9ea9c89c40794273b7286df3"
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "87e3b26b743ae27df328d1e9598b5b78"
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ddb6ccadff4df9f4c32733c956adfd7a"
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6ffbf00abfc4992f002537bdc1b84a92"
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.8.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.8.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.9.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "cc0a14a2f404966e445a180f6630a50e"
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "59c18644ffcc273f50f6893b5189a0e7"
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "62c3986629ed42e2f5adf58089a44e03"
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0cb9e7703ae4ae58414beec652fd371d"
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7e721b417ce449144e55252df965c48b"
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e09dd1dec069cf4c34264759e13f00c7"
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.9.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.9.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.10.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "67e8324762900ac7fe4b3be7e769057c"
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "11d221b431d4cea70f3fb81b6ee780cc"
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c02388711bad5f125b06af6698b6d95f"
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7d7971ebbf688d3150418ab435715130"
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d07d627612f970d32773c8b368a61989"
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "328fb7194a0b88a74ae4e28df09cba48"
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.10.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.10.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.11.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "446ba782fa98b28b16846523edaa1b62"
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "153b7c69cf37240e76fa47600e45fda0"
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "edff7c1c0c1351c54269eae2918dc7d7"
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8ef5eba4bdb322692e9d3e4178d7a89d"
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "591f72938c2ea91cbbad778f4176bb1c"
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "519d27a8c39cb2431ab73e1ea77d9c33"
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.11.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.11.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.12.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "6adc628f512fbd6f68b07377f005e288"
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7efdc64a30213e367e233bf506ee6063"
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "036adb101c53b95ca8627856b273e2a1"
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a939bce1a0d886f9e80a2950f8fad9f4"
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ff39117f3820fbd27e6718e0a0975b08"
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6e4915b90194dbaea2fec3dc66f9793b"
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.12.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.12.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.13.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "b52594bb32431274f23a204b04e4eb22"
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c3e6954240b67ab0ed617c045c1fd250"
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fb0d8ea8c8da25ebc3006e4984511830"
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e481bdc46a6493d2565ab1f011cf4d8b"
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4d9a9c1442465d89ca176f95d58fe3b2"
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "84bd008a623a81d5ca23d4a553c8c4eb"
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.13.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.13.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.14.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3ea970ad965783cb3f311393a4fd8c8c"
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "41d002699fd4f1309de9fc9e33b43971"
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6e1531b06e6c41c08164fe064d273f4d"
+ },
+ {
+ "dataPath": "params_shard_93.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "542db9d7d9a5bb1be3e103d908d6a4e3"
+ },
+ {
+ "dataPath": "params_shard_94.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c05d768fafbad54a0356d2fd3640c7f5"
+ },
+ {
+ "dataPath": "params_shard_95.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "57d3808109ff6367faffcc9cb34b3687"
+ },
+ {
+ "dataPath": "params_shard_96.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.14.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.14.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.15.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "91eb1dac5abffe045fc363f5142b4db2"
+ },
+ {
+ "dataPath": "params_shard_97.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "41a0b008b39956c01dbaa0ac77f9c599"
+ },
+ {
+ "dataPath": "params_shard_98.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e3c3cfb8edec3f6f3247641abd7f4d23"
+ },
+ {
+ "dataPath": "params_shard_99.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6fd6dcfef5cf44d452c6d1f0fa441cde"
+ },
+ {
+ "dataPath": "params_shard_100.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3b78c75da01f7f7692a3a7221be32d3d"
+ },
+ {
+ "dataPath": "params_shard_101.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6d2b2f16b30437147cdd3e2336747d31"
+ },
+ {
+ "dataPath": "params_shard_102.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.15.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.15.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.16.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "1458aee96bfaa4cdcc36a44fea3fa466"
+ },
+ {
+ "dataPath": "params_shard_103.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0e6eb0386c79eb0d4f355017d51c3e17"
+ },
+ {
+ "dataPath": "params_shard_104.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cce72bb84a8f4c0da8e1dbf71624bd94"
+ },
+ {
+ "dataPath": "params_shard_105.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "43a96d17ac8d32b3539025f618d558f0"
+ },
+ {
+ "dataPath": "params_shard_106.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "465045ea20f3bbf19b2372aa1a62caa6"
+ },
+ {
+ "dataPath": "params_shard_107.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2403d7c40b03113acbd1871145ac53dc"
+ },
+ {
+ "dataPath": "params_shard_108.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.16.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.16.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.17.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "1ecc6679bf77b85442cbf8a3359c2a39"
+ },
+ {
+ "dataPath": "params_shard_109.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "be3354129adcb336174df28214232df5"
+ },
+ {
+ "dataPath": "params_shard_110.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2e4bb7d2f4eafc359d470568840ef80c"
+ },
+ {
+ "dataPath": "params_shard_111.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c71b3b29ee081da4fb88b45f8580ef55"
+ },
+ {
+ "dataPath": "params_shard_112.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9337bdcf73e0cb13f060a01f8788174d"
+ },
+ {
+ "dataPath": "params_shard_113.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d12f5b4fbaebe380171383ec0bd74b0f"
+ },
+ {
+ "dataPath": "params_shard_114.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.17.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.17.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.18.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0e24c8ce4eb494fcf990f7fe613cb6b4"
+ },
+ {
+ "dataPath": "params_shard_115.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "15f7e6c47228f5036e7bee0e451156fa"
+ },
+ {
+ "dataPath": "params_shard_116.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d7fcdf15818a2f29cef70da67bc76c8c"
+ },
+ {
+ "dataPath": "params_shard_117.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ef1a543e211e4becabf65f802d25005e"
+ },
+ {
+ "dataPath": "params_shard_118.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "16aa3deab37e17397334573fb6463eeb"
+ },
+ {
+ "dataPath": "params_shard_119.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f40452819487b6eecbad18da87424781"
+ },
+ {
+ "dataPath": "params_shard_120.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.18.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.18.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.19.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "a5a031b9a3f0a75b8383f1c5788d0f2d"
+ },
+ {
+ "dataPath": "params_shard_121.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9750b689f2b01f0e596a40727d5fccf4"
+ },
+ {
+ "dataPath": "params_shard_122.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4593e4b7513f9a7140635bf6e267c10d"
+ },
+ {
+ "dataPath": "params_shard_123.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c8cd522156618d37f658b222b04bfd03"
+ },
+ {
+ "dataPath": "params_shard_124.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "329ef02e065eec0ed8b4c310b3e00f79"
+ },
+ {
+ "dataPath": "params_shard_125.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "842b9f8d739a471030b1e6b6ce5776d7"
+ },
+ {
+ "dataPath": "params_shard_126.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.19.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.19.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.20.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "55152bcff6321d77651f46e8acc065ac"
+ },
+ {
+ "dataPath": "params_shard_127.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5dd76a1651f5bc0e0e007a08ba04f994"
+ },
+ {
+ "dataPath": "params_shard_128.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2c94300c9e9159fec8a6850108ec9bdb"
+ },
+ {
+ "dataPath": "params_shard_129.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a8da8c542e1935d7e6e8a983916ab1cc"
+ },
+ {
+ "dataPath": "params_shard_130.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "549325365966648cdc2b0b37c400ee50"
+ },
+ {
+ "dataPath": "params_shard_131.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "01a57268b2797a658f61ad1471a394aa"
+ },
+ {
+ "dataPath": "params_shard_132.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.20.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.20.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.21.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "d564df6cd6e016459cef70979e317e1e"
+ },
+ {
+ "dataPath": "params_shard_133.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "723e2fe37b4386489c12f6b1ffc1af76"
+ },
+ {
+ "dataPath": "params_shard_134.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b8b37aabf671f0d01a75eb7ef716e15a"
+ },
+ {
+ "dataPath": "params_shard_135.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0f2d68d79e926c87adb6344283d7b7b4"
+ },
+ {
+ "dataPath": "params_shard_136.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c7bff6a03f9c932d3d18c27617243d03"
+ },
+ {
+ "dataPath": "params_shard_137.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d5a5c97ecfc5ad3b60a5578786c568d9"
+ },
+ {
+ "dataPath": "params_shard_138.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.21.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.21.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.22.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "00d52ed7bc4ca0ffff858c9328a6eede"
+ },
+ {
+ "dataPath": "params_shard_139.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a7d73b43e5269ab5d8c0b67add849415"
+ },
+ {
+ "dataPath": "params_shard_140.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "18ca5fae8405abff77c06663f08d7d42"
+ },
+ {
+ "dataPath": "params_shard_141.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e2e3d9e023fe7effe11cced2ed7550b6"
+ },
+ {
+ "dataPath": "params_shard_142.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "88728e3e3d2647a8b3944a3b195eca3c"
+ },
+ {
+ "dataPath": "params_shard_143.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4eaa2480172f911336a401c44401bde3"
+ },
+ {
+ "dataPath": "params_shard_144.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.22.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.22.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.23.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "6f344b82c7780c1f9f9a2ee6e5d19513"
+ },
+ {
+ "dataPath": "params_shard_145.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4a4e599a6ed96f87235ba2261ec0ee4a"
+ },
+ {
+ "dataPath": "params_shard_146.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2feafb1e4b7f874f74ac7980d3e470d9"
+ },
+ {
+ "dataPath": "params_shard_147.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "75cf0f21ab0a7f0d837d2c6662922db4"
+ },
+ {
+ "dataPath": "params_shard_148.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1dd07660663036e2f1d3b9f7eb7f4e4d"
+ },
+ {
+ "dataPath": "params_shard_149.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b17b79a00599fe80bb27ce10fcc1d034"
+ },
+ {
+ "dataPath": "params_shard_150.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.23.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.23.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.24.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "55e117e515d4bf1973cd9a29b6e87a56"
+ },
+ {
+ "dataPath": "params_shard_151.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "16fb56c4fb5ed2b04bd78f4804b52d78"
+ },
+ {
+ "dataPath": "params_shard_152.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3b9864c8837e9151d556d8a7a430578e"
+ },
+ {
+ "dataPath": "params_shard_153.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bbc6ccb16b2a3f60a7ba6b017060d803"
+ },
+ {
+ "dataPath": "params_shard_154.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "960ff57c964843f088be52574949aa12"
+ },
+ {
+ "dataPath": "params_shard_155.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ac5b211739a30c50a7a5c4e3f6b3207e"
+ },
+ {
+ "dataPath": "params_shard_156.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.24.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.24.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.25.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "832bf22413e726a4242eb7b41bc4ae64"
+ },
+ {
+ "dataPath": "params_shard_157.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b4923764cce29c5d680d9ead610b8407"
+ },
+ {
+ "dataPath": "params_shard_158.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c7bf7c27957a39eb012d8f0ba34937a1"
+ },
+ {
+ "dataPath": "params_shard_159.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "707639b35f3dedf8d2d0cf4628e0e367"
+ },
+ {
+ "dataPath": "params_shard_160.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9083d99dd53ff63fbb45c4210201f451"
+ },
+ {
+ "dataPath": "params_shard_161.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5ecc3310c774a8cd13cc9d10076328e8"
+ },
+ {
+ "dataPath": "params_shard_162.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.25.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.25.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.26.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e96dc2b6cfd17d133cb02eab8b0271bc"
+ },
+ {
+ "dataPath": "params_shard_163.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4d4764a646730b18172367df8eb28557"
+ },
+ {
+ "dataPath": "params_shard_164.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "37adf8a46753913c3e913a51aab1a859"
+ },
+ {
+ "dataPath": "params_shard_165.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1697d4b55629717d75bcef3382939e92"
+ },
+ {
+ "dataPath": "params_shard_166.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3054629bb410b61d23c4cd0d467b9e69"
+ },
+ {
+ "dataPath": "params_shard_167.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0bfdd76fc2ce834843bc1a57a9592b9b"
+ },
+ {
+ "dataPath": "params_shard_168.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.26.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.26.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.27.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "66151a706cca0cfcf13ef3e182ebe4c5"
+ },
+ {
+ "dataPath": "params_shard_169.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7fc0fe5f099cfa12f136ff25b83d0882"
+ },
+ {
+ "dataPath": "params_shard_170.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d3d19466530974d1ce877f3d2edb5ad0"
+ },
+ {
+ "dataPath": "params_shard_171.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a7e89855eec67b4a1e193f479a1e5b0e"
+ },
+ {
+ "dataPath": "params_shard_172.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "85bae35685720078878a2378d51fef32"
+ },
+ {
+ "dataPath": "params_shard_173.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "604297ea4f793df2fd675316a52cb908"
+ },
+ {
+ "dataPath": "params_shard_174.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.27.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.27.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.28.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "76745db00e62886a70aa04f18528bc29"
+ },
+ {
+ "dataPath": "params_shard_175.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6b5d2acf2e8be2671bfb89db787ee9b7"
+ },
+ {
+ "dataPath": "params_shard_176.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bcb7f57170b1e63c194306ddde26bf39"
+ },
+ {
+ "dataPath": "params_shard_177.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "87d79049d0a6be81a42e13cafd7beda2"
+ },
+ {
+ "dataPath": "params_shard_178.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "315d82715d6ef1b7cd23312ce753b82e"
+ },
+ {
+ "dataPath": "params_shard_179.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "255714be9e01d9463abbde03e5713c0b"
+ },
+ {
+ "dataPath": "params_shard_180.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.28.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.28.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.29.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "a228e72ba9dd83031e48a13dd92d4281"
+ },
+ {
+ "dataPath": "params_shard_181.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0ad4d0c000d31e55c174d04f4e14461d"
+ },
+ {
+ "dataPath": "params_shard_182.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5b3c25707e873154b1f523e5117cce1b"
+ },
+ {
+ "dataPath": "params_shard_183.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a33b318d03f2902184f4ba0a340d2e10"
+ },
+ {
+ "dataPath": "params_shard_184.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "48e756030a6b7b97547a24655a712eec"
+ },
+ {
+ "dataPath": "params_shard_185.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b3d2a6992933ba39c53f04d1b3477deb"
+ },
+ {
+ "dataPath": "params_shard_186.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.29.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.29.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.30.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e92e9f2c855851ce97de12c7e7357784"
+ },
+ {
+ "dataPath": "params_shard_187.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6c19b1f87a58e5e6cfd03fab5feb83af"
+ },
+ {
+ "dataPath": "params_shard_188.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6ba430021cd6bf17eb85c8f3d942e70e"
+ },
+ {
+ "dataPath": "params_shard_189.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f6ecce4e1bc0c2d692465af9dcb1cd17"
+ },
+ {
+ "dataPath": "params_shard_190.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f441d44d2286a121fe9a511d83edb366"
+ },
+ {
+ "dataPath": "params_shard_191.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "579447addcf4a7ce16058ac1ed87a218"
+ },
+ {
+ "dataPath": "params_shard_192.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.30.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.30.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.31.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "7257b70cfed1bc42116080579af1ba7f"
+ },
+ {
+ "dataPath": "params_shard_193.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2a4e62c519189f5b4fd2d5e9c69d6b89"
+ },
+ {
+ "dataPath": "params_shard_194.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "be17e08702b11d801aa37448120642ad"
+ },
+ {
+ "dataPath": "params_shard_195.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9475a09dbb54549f2c31675596107758"
+ },
+ {
+ "dataPath": "params_shard_196.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "617a16f3f332e1467fdc2368b86a8295"
+ },
+ {
+ "dataPath": "params_shard_197.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "034d4a7ea29f196c81809f009b7bccc6"
+ },
+ {
+ "dataPath": "params_shard_198.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.31.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.31.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.32.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "10f49b31ed8ffee563ee8d0b8736c5dd"
+ },
+ {
+ "dataPath": "params_shard_199.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a0fd4c3845e38db25e398a2063ce56f7"
+ },
+ {
+ "dataPath": "params_shard_200.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "69dfcb2e0983e5650381b9ba5140bbd0"
+ },
+ {
+ "dataPath": "params_shard_201.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dec404dbcc16182ac9a5a37ea2cbf035"
+ },
+ {
+ "dataPath": "params_shard_202.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bc1fb22804c3bd111eb25839dc231154"
+ },
+ {
+ "dataPath": "params_shard_203.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6de1e368c25d64f26d28151f482181db"
+ },
+ {
+ "dataPath": "params_shard_204.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.32.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.32.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.33.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "eebab0464c9abcdd6b77c3cbefa7b42c"
+ },
+ {
+ "dataPath": "params_shard_205.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "60ff484f88993e03a8f453badcfda390"
+ },
+ {
+ "dataPath": "params_shard_206.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "03e7349beb373ca0e9e4deb206fc4b0f"
+ },
+ {
+ "dataPath": "params_shard_207.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cf1fc5e3fefc97b4a8ca3e7cee70c768"
+ },
+ {
+ "dataPath": "params_shard_208.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dffd13c3b184a64c39cf3acfaf5dc58c"
+ },
+ {
+ "dataPath": "params_shard_209.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cf53ca89d73b601a9f177b182d6092f2"
+ },
+ {
+ "dataPath": "params_shard_210.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.33.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.33.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.34.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "1c49c190226fc8211712f3b1b8653920"
+ },
+ {
+ "dataPath": "params_shard_211.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "22055b8b9aaa4595fbfa7df844b79762"
+ },
+ {
+ "dataPath": "params_shard_212.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ded93e0d85f45316060017716dc15dc4"
+ },
+ {
+ "dataPath": "params_shard_213.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "72e75a828a24fe61b446d57651b5bce8"
+ },
+ {
+ "dataPath": "params_shard_214.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2992a932a146961b345a7079a9664452"
+ },
+ {
+ "dataPath": "params_shard_215.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d177d163b6940fe6c0a61b9063ebb6f9"
+ },
+ {
+ "dataPath": "params_shard_216.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.34.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.34.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.35.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "fb382ac4c04565529c3fc8828dfb6233"
+ },
+ {
+ "dataPath": "params_shard_217.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "eaf5134b38bf2e24555b125503482e5d"
+ },
+ {
+ "dataPath": "params_shard_218.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "35cd7f1d1cc41508ff6ec3582e6a91a6"
+ },
+ {
+ "dataPath": "params_shard_219.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1d090f84737bc1bd048cbba2c80fe5f6"
+ },
+ {
+ "dataPath": "params_shard_220.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "efe9987c4094c7c62598b994f813e361"
+ },
+ {
+ "dataPath": "params_shard_221.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "abff04e8aa47e69f0a41209476abeea3"
+ },
+ {
+ "dataPath": "params_shard_222.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.35.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.35.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.36.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "94e1d1bd1f7dcc6509707afe6731d1c4"
+ },
+ {
+ "dataPath": "params_shard_223.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9a2834319370e6dadc2efccc65edb752"
+ },
+ {
+ "dataPath": "params_shard_224.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6017e008a73567c76fe946cfb36492ef"
+ },
+ {
+ "dataPath": "params_shard_225.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "71ead886a3687e6ca0c1b2babd6116e5"
+ },
+ {
+ "dataPath": "params_shard_226.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "424cb342ff21a85a6e9108f3603fdc51"
+ },
+ {
+ "dataPath": "params_shard_227.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3a4b6da277c8d572eb94590aeb50ba70"
+ },
+ {
+ "dataPath": "params_shard_228.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.36.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.36.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.37.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "eb98afac840141f12510c9d1d4df6833"
+ },
+ {
+ "dataPath": "params_shard_229.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "53cab22161f19f5ce3613a11dea94b50"
+ },
+ {
+ "dataPath": "params_shard_230.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a28706990b763ed0a5019593382ecf03"
+ },
+ {
+ "dataPath": "params_shard_231.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "be2ebcc3c6b30fc06806a51333a90057"
+ },
+ {
+ "dataPath": "params_shard_232.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0ce9e87ccdb2a22b8d0ba97ba3c5ef2d"
+ },
+ {
+ "dataPath": "params_shard_233.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f24069810d67104d77ef6d26a9a2e4d0"
+ },
+ {
+ "dataPath": "params_shard_234.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.37.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.37.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.38.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "91f4c5717086fcca01d72fa14d06938d"
+ },
+ {
+ "dataPath": "params_shard_235.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6097e7c304dc09f3ddbf0c7502e542fa"
+ },
+ {
+ "dataPath": "params_shard_236.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6fa3c0e2629c8a572c112cd2267b420c"
+ },
+ {
+ "dataPath": "params_shard_237.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ff98c417af076bcae3648c142e58985a"
+ },
+ {
+ "dataPath": "params_shard_238.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1bfcd469359cb955a933bbef2093ef95"
+ },
+ {
+ "dataPath": "params_shard_239.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f181b9788adbf872e9ec6bc0876dfdfc"
+ },
+ {
+ "dataPath": "params_shard_240.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.38.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.38.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.39.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "870ce34f5f103b7f1d0bfe3134f3d88f"
+ },
+ {
+ "dataPath": "params_shard_241.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "489d2ad5a79666d6b9ea31d5bd95b18b"
+ },
+ {
+ "dataPath": "params_shard_242.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7d902127092aaed807918ffbae507bce"
+ },
+ {
+ "dataPath": "params_shard_243.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3f69ecf21255f098ee6aefaf5236e7b3"
+ },
+ {
+ "dataPath": "params_shard_244.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "81239fbc9ef662ddfa1938f32624b5cf"
+ },
+ {
+ "dataPath": "params_shard_245.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d9a806edd5bb4e79ec1150568fcbccd7"
+ },
+ {
+ "dataPath": "params_shard_246.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.39.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.39.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.40.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3d78984dc0a0a02e3eb9a9cd69bf82a9"
+ },
+ {
+ "dataPath": "params_shard_247.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "26200b505cf2690fbed14c37d65821a2"
+ },
+ {
+ "dataPath": "params_shard_248.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2621ad8bcf3c8a8498257c30b42099b2"
+ },
+ {
+ "dataPath": "params_shard_249.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "34acf2118b6829c5b6de8f2b3ca10196"
+ },
+ {
+ "dataPath": "params_shard_250.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "668badfe5a4f59b33156fde26c3aadb6"
+ },
+ {
+ "dataPath": "params_shard_251.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "48787f742903d7e55b667953b999b6c1"
+ },
+ {
+ "dataPath": "params_shard_252.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.40.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.40.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.41.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "8aec31e865b525b2e8ea0d3fe71b6685"
+ },
+ {
+ "dataPath": "params_shard_253.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1a8cb1e6eb17920abb866645d9c18dc3"
+ },
+ {
+ "dataPath": "params_shard_254.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "31058e7c4c35deff580dba6ffd176709"
+ },
+ {
+ "dataPath": "params_shard_255.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7b7b8106ec5847f1e305b195ef98700b"
+ },
+ {
+ "dataPath": "params_shard_256.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f9995ae3d7ab4b5247672f8864065128"
+ },
+ {
+ "dataPath": "params_shard_257.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "56a29a8e09ad4e0c40c3e4e5d592935e"
+ },
+ {
+ "dataPath": "params_shard_258.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.41.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.41.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.42.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "7df87c317ac9a49339e8fc1a5abe4658"
+ },
+ {
+ "dataPath": "params_shard_259.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6b7578bd18d7328550c4455a551512dc"
+ },
+ {
+ "dataPath": "params_shard_260.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c3a680dacf8e6d842873473fe23f5f44"
+ },
+ {
+ "dataPath": "params_shard_261.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d750d2c9478dc6ba38d1c1d0e2931718"
+ },
+ {
+ "dataPath": "params_shard_262.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "299d107fd9ab3123adc1286fe2300586"
+ },
+ {
+ "dataPath": "params_shard_263.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b64c91f7c46f48746500e83c606ea38b"
+ },
+ {
+ "dataPath": "params_shard_264.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.42.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.42.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.43.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "b20f103c54407594a7fe20788749370f"
+ },
+ {
+ "dataPath": "params_shard_265.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "466b481c6ba5deeb13ad957b9e9eb372"
+ },
+ {
+ "dataPath": "params_shard_266.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d0ac3a48d455ed0df1ec76b87bd16bad"
+ },
+ {
+ "dataPath": "params_shard_267.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2ac2d16d059cfc3574e521610bc2927f"
+ },
+ {
+ "dataPath": "params_shard_268.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "de663dfdf2d5945384ce2b67b148f154"
+ },
+ {
+ "dataPath": "params_shard_269.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f36923ecfe7a5bd505ef8559d7899796"
+ },
+ {
+ "dataPath": "params_shard_270.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.43.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.43.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.44.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "395c4a5552a59a618a7d626cce5d7208"
+ },
+ {
+ "dataPath": "params_shard_271.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4b6d7179a70785561a0a6ed5309888ff"
+ },
+ {
+ "dataPath": "params_shard_272.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c679a0df3f5e92e6d3339b8ac428e796"
+ },
+ {
+ "dataPath": "params_shard_273.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e1b81c070dbeceb39135d4c202af362b"
+ },
+ {
+ "dataPath": "params_shard_274.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d3d8d8352e0830c282af512cbf3a7d2a"
+ },
+ {
+ "dataPath": "params_shard_275.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "091adae1147662150af5863f532cb72e"
+ },
+ {
+ "dataPath": "params_shard_276.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.44.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.44.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.45.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "396c4f3dc36e328a599375c5ada2f318"
+ },
+ {
+ "dataPath": "params_shard_277.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "715910e287747b7f7d20d03954f34b6d"
+ },
+ {
+ "dataPath": "params_shard_278.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c9b6b2aa642ce220c5918318d5c45769"
+ },
+ {
+ "dataPath": "params_shard_279.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cf7a834f9ec146d7a956b24241e80367"
+ },
+ {
+ "dataPath": "params_shard_280.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fef0150714567dcdaeed6f925a84d1b7"
+ },
+ {
+ "dataPath": "params_shard_281.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "19f7a50e653239f72ffd1c929882baeb"
+ },
+ {
+ "dataPath": "params_shard_282.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.45.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.45.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.46.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "310010d9ee4c241269a85f524502ebdb"
+ },
+ {
+ "dataPath": "params_shard_283.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7dcf3ea58586cbb536c537e6454b5524"
+ },
+ {
+ "dataPath": "params_shard_284.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6e0e702c56ee82481f2820102e8a0a69"
+ },
+ {
+ "dataPath": "params_shard_285.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "68c353415dac3c064d86dbc5b3a16960"
+ },
+ {
+ "dataPath": "params_shard_286.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "14e025995405cceeb242ad7a245c276f"
+ },
+ {
+ "dataPath": "params_shard_287.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0facefef3618b7a601e7210755363bed"
+ },
+ {
+ "dataPath": "params_shard_288.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.46.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.46.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.47.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "2e7c4727372e41e64b66c0724f5d667e"
+ },
+ {
+ "dataPath": "params_shard_289.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.48.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4797897507e5d90a44718d86a5d7411b"
+ },
+ {
+ "dataPath": "params_shard_290.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.48.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "eb6726bdc774170d5225df58501f1668"
+ },
+ {
+ "dataPath": "params_shard_291.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d78180e57b1cd29a82421939521988a6"
+ },
+ {
+ "dataPath": "params_shard_292.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b86236bee5046b03321d60c6538d813b"
+ },
+ {
+ "dataPath": "params_shard_293.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f016dafc758f955c246e93ece14fe0cb"
+ },
+ {
+ "dataPath": "params_shard_294.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.47.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.47.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.48.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.48.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "1c6c14f1c31e217f16513410ce74b34e"
+ },
+ {
+ "dataPath": "params_shard_295.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.49.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8c8e7b46befbc184de00d71f0d7b49e5"
+ },
+ {
+ "dataPath": "params_shard_296.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.49.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "23e4c1efdc807e598c5653a7f59ae8b6"
+ },
+ {
+ "dataPath": "params_shard_297.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "13ef6b657a238ec4159ca0c9ea4237c9"
+ },
+ {
+ "dataPath": "params_shard_298.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "85ef4c5b54532dd908474a52a0d48807"
+ },
+ {
+ "dataPath": "params_shard_299.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "668977a5e9c9f463946548009888bda1"
+ },
+ {
+ "dataPath": "params_shard_300.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.48.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.48.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.49.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.49.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "4126e62458335028c9409c1e68b455f5"
+ },
+ {
+ "dataPath": "params_shard_301.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.50.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b1362ed474575b0ad77ad974e09e84d1"
+ },
+ {
+ "dataPath": "params_shard_302.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.50.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "feda34586438bd54523d40ccf1102799"
+ },
+ {
+ "dataPath": "params_shard_303.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "addd223cc24ef648a37bf79846e1a113"
+ },
+ {
+ "dataPath": "params_shard_304.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a26e41323ddcb083a6dcbdead33080b1"
+ },
+ {
+ "dataPath": "params_shard_305.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b2caa9261542dbda273e0a667834b6ba"
+ },
+ {
+ "dataPath": "params_shard_306.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.49.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.49.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.50.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.50.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3ffaf477c1ae8230721ab326e606c72c"
+ },
+ {
+ "dataPath": "params_shard_307.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.51.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a3b71316acdccadcbe03e64adef43f7a"
+ },
+ {
+ "dataPath": "params_shard_308.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.51.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "69e8430806fe7138ec9463e9590f44a8"
+ },
+ {
+ "dataPath": "params_shard_309.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6e0d7e744c6c162521be704168488700"
+ },
+ {
+ "dataPath": "params_shard_310.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6c747e10c677c6c7d9046f1b72688403"
+ },
+ {
+ "dataPath": "params_shard_311.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d24915e43cfa356b61221313e5c2b58b"
+ },
+ {
+ "dataPath": "params_shard_312.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.50.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.50.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.51.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.51.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "b0fb953a904c0e92c57807d5b260d32a"
+ },
+ {
+ "dataPath": "params_shard_313.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.52.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b66b297d0ab1ff2e34221ec79a1198f5"
+ },
+ {
+ "dataPath": "params_shard_314.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.52.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2d8bd855a487d31e2275f4e282aedd27"
+ },
+ {
+ "dataPath": "params_shard_315.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f1a30af02430f98aef6c12577eadb9cf"
+ },
+ {
+ "dataPath": "params_shard_316.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "46058db992963bbab0b78d6e890b6b92"
+ },
+ {
+ "dataPath": "params_shard_317.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ebfb365e591b36e00edf31303701f936"
+ },
+ {
+ "dataPath": "params_shard_318.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.51.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.51.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.52.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.52.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "ed84db204666941f82e57da6d2a20a79"
+ },
+ {
+ "dataPath": "params_shard_319.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.53.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8806bfb23abea78c84232e20babfc9bd"
+ },
+ {
+ "dataPath": "params_shard_320.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.53.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8c2335087d48a6a2016bdebed1c59ae7"
+ },
+ {
+ "dataPath": "params_shard_321.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ffd7d595880a237148cd8ae355ba602a"
+ },
+ {
+ "dataPath": "params_shard_322.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "55e206309e7a35ab7b5f66ad63c60bec"
+ },
+ {
+ "dataPath": "params_shard_323.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5dc99f9d4917b6fd2a1c90dc3b09da51"
+ },
+ {
+ "dataPath": "params_shard_324.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.52.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.52.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.53.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.53.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "855bb5a566e41bfeeb834be6f81dc405"
+ },
+ {
+ "dataPath": "params_shard_325.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.54.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9c56f32df3b7d481acf24dac25df7972"
+ },
+ {
+ "dataPath": "params_shard_326.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.54.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ef4ed9183f752eed57ac2428447852e8"
+ },
+ {
+ "dataPath": "params_shard_327.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "85186906e9571253ad27edb540b06ec7"
+ },
+ {
+ "dataPath": "params_shard_328.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "68124a12cfa492a9c7a5506b0e2bcb18"
+ },
+ {
+ "dataPath": "params_shard_329.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "975e330ea6712b583d66f68bee36c7b8"
+ },
+ {
+ "dataPath": "params_shard_330.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.53.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.53.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.54.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.54.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "15ea420a140c9d98f158f07fc57c1b03"
+ },
+ {
+ "dataPath": "params_shard_331.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.55.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d15415c9bb221f4e031ca192c61c1a69"
+ },
+ {
+ "dataPath": "params_shard_332.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.55.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1a288f49ad800f6637bfdb640148c687"
+ },
+ {
+ "dataPath": "params_shard_333.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "514e9b09765dd88b5ff2dda90ac2a70b"
+ },
+ {
+ "dataPath": "params_shard_334.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4b0856512de0909264383098551a1bdf"
+ },
+ {
+ "dataPath": "params_shard_335.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e5a14db12b187563022f03232172b310"
+ },
+ {
+ "dataPath": "params_shard_336.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.54.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.54.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.55.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.55.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c982e6434ab28b3bf6d45af088802057"
+ },
+ {
+ "dataPath": "params_shard_337.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.56.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1bfd45bc7b133d34b11e7fdbaf369b74"
+ },
+ {
+ "dataPath": "params_shard_338.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.56.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e6691e95231d873a45e1631cd0fa64db"
+ },
+ {
+ "dataPath": "params_shard_339.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "273c5f87c35cbfc5f908e1c0a4bf0e82"
+ },
+ {
+ "dataPath": "params_shard_340.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8f61b31cef41b820e26d11d5ae1e6747"
+ },
+ {
+ "dataPath": "params_shard_341.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "15129acdd1cfa244a40f7b39219e40ab"
+ },
+ {
+ "dataPath": "params_shard_342.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.55.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.55.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.56.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.56.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "37652e3ba6f2241f9145940a2b0bbc8a"
+ },
+ {
+ "dataPath": "params_shard_343.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.57.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "30e53772be7b43b485ab88a509fb1332"
+ },
+ {
+ "dataPath": "params_shard_344.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.57.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7b054392dbd00e565e5a4f4a57915468"
+ },
+ {
+ "dataPath": "params_shard_345.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ce8cb8f6b86e0739e116f8abe35f620e"
+ },
+ {
+ "dataPath": "params_shard_346.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "29e41e33adfffc0f23ffa5a6bf382798"
+ },
+ {
+ "dataPath": "params_shard_347.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8b761fc8df907c575b42cd3a5db17fa9"
+ },
+ {
+ "dataPath": "params_shard_348.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.56.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.56.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.57.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.57.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "248e1a6ab692d4f05d53437469bef209"
+ },
+ {
+ "dataPath": "params_shard_349.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.58.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "28af4885dbe406e5554ec582605d067e"
+ },
+ {
+ "dataPath": "params_shard_350.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.58.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c65863a797fcd26973670cf93ca1a37a"
+ },
+ {
+ "dataPath": "params_shard_351.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5d81c267914b4ad517cae714910f7359"
+ },
+ {
+ "dataPath": "params_shard_352.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "22650bbc1c69fa27dddae1c74f4e8e47"
+ },
+ {
+ "dataPath": "params_shard_353.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "267b00fefe99b5563457a4730e189691"
+ },
+ {
+ "dataPath": "params_shard_354.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.57.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.57.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.58.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.58.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "f1468e3496cee916cf79079c2deedf51"
+ },
+ {
+ "dataPath": "params_shard_355.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.59.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3c508649688c0d1c29a3990bdf63fdbd"
+ },
+ {
+ "dataPath": "params_shard_356.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.59.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "167dabe73b1deba4eb06ef53b4d6db8f"
+ },
+ {
+ "dataPath": "params_shard_357.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "99e214ef736d822c0d45f6967a387b7d"
+ },
+ {
+ "dataPath": "params_shard_358.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0882637a5a47f2fc8d895b97e19ca1f2"
+ },
+ {
+ "dataPath": "params_shard_359.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ef763d04b7984523dbdfb8d7cc321a6f"
+ },
+ {
+ "dataPath": "params_shard_360.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.58.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.58.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.59.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.59.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "b692b3aabd00dfbd7a2c4526eca0829c"
+ },
+ {
+ "dataPath": "params_shard_361.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.60.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3b9c7a8a1b62f97805ff022200fa5dde"
+ },
+ {
+ "dataPath": "params_shard_362.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.60.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7120d34e9fa01b7ca77c2292c3469558"
+ },
+ {
+ "dataPath": "params_shard_363.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e7f5e2acf1208413b770a1726c56254e"
+ },
+ {
+ "dataPath": "params_shard_364.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "765964437e9b03a2ae951f3bf70eb9af"
+ },
+ {
+ "dataPath": "params_shard_365.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6f576b1c6a4f0ee9e153cb46f0dc180f"
+ },
+ {
+ "dataPath": "params_shard_366.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.59.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.59.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.60.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.60.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e9fb54e0e15bb81ee0719eaf74d448d4"
+ },
+ {
+ "dataPath": "params_shard_367.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.61.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "edaaa55343007b7a32a8e0981b122f7c"
+ },
+ {
+ "dataPath": "params_shard_368.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.61.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f160724dd200ce47f7fbf0d733828ada"
+ },
+ {
+ "dataPath": "params_shard_369.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "477c1fd7af280335c11cafd68d81556d"
+ },
+ {
+ "dataPath": "params_shard_370.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "25c71f7f3b9d48394f0f930204a56b23"
+ },
+ {
+ "dataPath": "params_shard_371.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2774abe21d787f9020c9839a4faf565f"
+ },
+ {
+ "dataPath": "params_shard_372.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.60.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.60.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.61.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.61.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "d9cf309f14543beb9c54ee758d20066f"
+ },
+ {
+ "dataPath": "params_shard_373.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.62.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6dbe1cf8f0a476ea64485640be12e909"
+ },
+ {
+ "dataPath": "params_shard_374.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.62.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "94e1b87a01381e807f6ac5dedcb82fea"
+ },
+ {
+ "dataPath": "params_shard_375.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5b9eb5c37c6ea03d00b433aec7d8ab25"
+ },
+ {
+ "dataPath": "params_shard_376.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a97e57b1a2c112096d5fdd92c35587c5"
+ },
+ {
+ "dataPath": "params_shard_377.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "98fc4fdc3aa28ae8ad53fba8d471f66b"
+ },
+ {
+ "dataPath": "params_shard_378.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.61.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.61.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.62.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.62.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "83c7888016389785ca8e9466b2b41671"
+ },
+ {
+ "dataPath": "params_shard_379.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.63.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8f817272f3eeabe5e1a7d2c7ca4813b9"
+ },
+ {
+ "dataPath": "params_shard_380.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.63.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "82531ebc2e4ac14233dfb329015f69a1"
+ },
+ {
+ "dataPath": "params_shard_381.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4a24278378e2abc5125803b2ff25bf8c"
+ },
+ {
+ "dataPath": "params_shard_382.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4c95ec67ed15f612d33813c02685e16f"
+ },
+ {
+ "dataPath": "params_shard_383.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0d43a30afa7f57c53b679a80a6616be5"
+ },
+ {
+ "dataPath": "params_shard_384.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.62.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.62.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.63.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.63.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "b7a3b05f7fe1a3962f3b78163a982285"
+ },
+ {
+ "dataPath": "params_shard_385.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.64.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5ec043c40e16d66c2e8ffa26be952c5b"
+ },
+ {
+ "dataPath": "params_shard_386.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.64.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b7ef21a90910a12803d4e79f50be3bad"
+ },
+ {
+ "dataPath": "params_shard_387.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0a3a968c7ca9780843ac0766e520ddad"
+ },
+ {
+ "dataPath": "params_shard_388.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c7598f52110b0c1d840d9431773fd10f"
+ },
+ {
+ "dataPath": "params_shard_389.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a0f31d8012bc48d6ee15ce183afa70eb"
+ },
+ {
+ "dataPath": "params_shard_390.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.63.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.63.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.64.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.64.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "f2ee3797604d8f4413c4df86c037c88d"
+ },
+ {
+ "dataPath": "params_shard_391.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.65.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f49c3e2d02b0ed8bb45adb2f4b11e650"
+ },
+ {
+ "dataPath": "params_shard_392.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.65.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4959a7a4fe61945e888ea3b8053e034d"
+ },
+ {
+ "dataPath": "params_shard_393.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "809bca1ed0e570af03b5b96c9185b612"
+ },
+ {
+ "dataPath": "params_shard_394.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "08ba42b52f1d902ac56eb765586052b0"
+ },
+ {
+ "dataPath": "params_shard_395.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2ec6752553b71385583b0cc85e13e3c8"
+ },
+ {
+ "dataPath": "params_shard_396.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.64.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.64.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.65.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.65.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "47df40bf42fcbbe9330de8452db32c30"
+ },
+ {
+ "dataPath": "params_shard_397.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.66.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2065f2f7b07ccef9bc0b0542d92cccf9"
+ },
+ {
+ "dataPath": "params_shard_398.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.66.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "642a43b9f74d436e71fbf453bba9d69e"
+ },
+ {
+ "dataPath": "params_shard_399.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "85b20ed9697e240823af10e4868b648b"
+ },
+ {
+ "dataPath": "params_shard_400.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c0fa16ad2c1cd8465ca27fb1e51a47bd"
+ },
+ {
+ "dataPath": "params_shard_401.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9a33229ac8cb774e46a00b88d9529371"
+ },
+ {
+ "dataPath": "params_shard_402.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.65.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.65.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.66.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.66.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "fae8cd60d019708966ff5e80cfa64af8"
+ },
+ {
+ "dataPath": "params_shard_403.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.67.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "83e9753da1e94f333c935f2910fef1fe"
+ },
+ {
+ "dataPath": "params_shard_404.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.67.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2f6ec29a28711373929ee90e3aed37c5"
+ },
+ {
+ "dataPath": "params_shard_405.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "629fa50befe958db76d7bf6cb28466df"
+ },
+ {
+ "dataPath": "params_shard_406.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "049b8a023c70714dc6474da294d8f872"
+ },
+ {
+ "dataPath": "params_shard_407.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ad215d593ebaa2da71c478b9d7149bd7"
+ },
+ {
+ "dataPath": "params_shard_408.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.66.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.66.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.67.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.67.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "76e2b53854bec34fc6320f039bc71ee1"
+ },
+ {
+ "dataPath": "params_shard_409.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.68.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "717264a93e96af5b10f77b6a6f7d8737"
+ },
+ {
+ "dataPath": "params_shard_410.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.68.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "344c6d2a06e3f13c06e6ebc993ba037d"
+ },
+ {
+ "dataPath": "params_shard_411.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fad70137074baf855af688f71c040c27"
+ },
+ {
+ "dataPath": "params_shard_412.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "80b1e0bf9088a606d98c6ec653472b33"
+ },
+ {
+ "dataPath": "params_shard_413.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f89dca7b82e8b5069b66dabe73073dd3"
+ },
+ {
+ "dataPath": "params_shard_414.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.67.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.67.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.68.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.68.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "7f590d0262d8ba875a27cb701a031f30"
+ },
+ {
+ "dataPath": "params_shard_415.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.69.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bf1ffaac595e7a8ed91758567cf79ebe"
+ },
+ {
+ "dataPath": "params_shard_416.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.69.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7b0f78febdd88296b06ebf2711a578a9"
+ },
+ {
+ "dataPath": "params_shard_417.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ddf82d110588d47cdc22df131fa807ac"
+ },
+ {
+ "dataPath": "params_shard_418.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "222225c7430979e226c03e0ea62ebe01"
+ },
+ {
+ "dataPath": "params_shard_419.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3b42ef1fac67793c69aa827b39397b35"
+ },
+ {
+ "dataPath": "params_shard_420.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.68.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.68.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.69.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.69.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "99995bdbef7d54ea786da0d5b832d74f"
+ },
+ {
+ "dataPath": "params_shard_421.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.70.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9d5f0ef990487fd25bed24aac360171b"
+ },
+ {
+ "dataPath": "params_shard_422.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.70.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "20948c4d080275a144c5a24c61a0c92a"
+ },
+ {
+ "dataPath": "params_shard_423.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b2ea5000615ee9682c82a7872bd1f8df"
+ },
+ {
+ "dataPath": "params_shard_424.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1c68cb8832efc783671fb8f098cb7fe5"
+ },
+ {
+ "dataPath": "params_shard_425.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a4da646f71d01ead17842f1ffacddd45"
+ },
+ {
+ "dataPath": "params_shard_426.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.69.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.69.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.70.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.70.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c0a6f2893b045c33c22f151618a06253"
+ },
+ {
+ "dataPath": "params_shard_427.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.71.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c2e2b6a220717684388cf37ed741106f"
+ },
+ {
+ "dataPath": "params_shard_428.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.71.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cac5f4f50f81b87092546d3707441d34"
+ },
+ {
+ "dataPath": "params_shard_429.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6b73ce62871d2d5746e15dacbcfca325"
+ },
+ {
+ "dataPath": "params_shard_430.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0c51867dea35d8deb532e6788ad49862"
+ },
+ {
+ "dataPath": "params_shard_431.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5a17824c2cf42b320ef0dafa8d8b3994"
+ },
+ {
+ "dataPath": "params_shard_432.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.70.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.70.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.71.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.71.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "8416e348687dbf11348bab7768d07142"
+ },
+ {
+ "dataPath": "params_shard_433.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.72.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1fe2f4551503214952f2a863c70cdb3f"
+ },
+ {
+ "dataPath": "params_shard_434.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.72.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9bf8e01f1929549ec8174982124c42ad"
+ },
+ {
+ "dataPath": "params_shard_435.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8d2d1237f08242d5b7edd3a25bd0a392"
+ },
+ {
+ "dataPath": "params_shard_436.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "02a79c6f1b017f2ac230f9f3759849e8"
+ },
+ {
+ "dataPath": "params_shard_437.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2ed8e8fa5dbe605671f9a14688bef3dc"
+ },
+ {
+ "dataPath": "params_shard_438.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.71.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.71.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.72.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.72.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "5200be8c36edfe3091dc599caa9f2ec7"
+ },
+ {
+ "dataPath": "params_shard_439.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.73.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e61933faf96a5039317f2c75cd759e25"
+ },
+ {
+ "dataPath": "params_shard_440.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.73.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "991aea932ad579c8bc7d05f1afa7d3ea"
+ },
+ {
+ "dataPath": "params_shard_441.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "76cc1db24e45824a3c308abe7388285c"
+ },
+ {
+ "dataPath": "params_shard_442.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b5e4c6333d8e1cd8b11c9686097eb10d"
+ },
+ {
+ "dataPath": "params_shard_443.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "553471df3c6ee74dbeee63634c98da76"
+ },
+ {
+ "dataPath": "params_shard_444.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.72.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.72.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.73.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.73.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "9af943f9256df0ef6e2f8a9e8229ec75"
+ },
+ {
+ "dataPath": "params_shard_445.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.74.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4b2b2e5af96b0bbbc7d6cffbbb9921aa"
+ },
+ {
+ "dataPath": "params_shard_446.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.74.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a1da62b4103b0a25a9fea785dbbd8ab4"
+ },
+ {
+ "dataPath": "params_shard_447.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d8d5331cbda0cf3a477a04dbde6b2230"
+ },
+ {
+ "dataPath": "params_shard_448.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a5b9e0f40e3c5b96adc8e5a4d9bd7b4"
+ },
+ {
+ "dataPath": "params_shard_449.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cbcb6b58f0855999704a4ecd9e113fde"
+ },
+ {
+ "dataPath": "params_shard_450.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.73.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.73.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.74.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.74.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "9b2e87adb075eaae329d79238976c629"
+ },
+ {
+ "dataPath": "params_shard_451.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.75.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "acf5d871253ab601d364684891f98f82"
+ },
+ {
+ "dataPath": "params_shard_452.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.75.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "998fb08572d980ce0053b779ac546e2c"
+ },
+ {
+ "dataPath": "params_shard_453.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "11fd66edd06539e66af314e1ec9af965"
+ },
+ {
+ "dataPath": "params_shard_454.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a4260015fe3acf4a47d1f5bdfdc522ec"
+ },
+ {
+ "dataPath": "params_shard_455.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9d67aa2513051d4862c0404fffd395d8"
+ },
+ {
+ "dataPath": "params_shard_456.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.74.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.74.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.75.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.75.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "db6dc115490c934229e43a90553031ce"
+ },
+ {
+ "dataPath": "params_shard_457.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.76.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9bdc1c435b9f50bc4c30935439afb653"
+ },
+ {
+ "dataPath": "params_shard_458.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.76.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "00110c365e91fdf6895eeb679e929002"
+ },
+ {
+ "dataPath": "params_shard_459.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7098213bc764ad70fdc5a57c385daac8"
+ },
+ {
+ "dataPath": "params_shard_460.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e249634614a836bed13684dbe61a6c3e"
+ },
+ {
+ "dataPath": "params_shard_461.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fb4d4c324e19709dc8a1a1f04dd2b736"
+ },
+ {
+ "dataPath": "params_shard_462.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.75.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.75.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.76.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.76.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "243237052f648c5a163b970ad323a269"
+ },
+ {
+ "dataPath": "params_shard_463.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.77.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "df5360a730ad561471839489b095482d"
+ },
+ {
+ "dataPath": "params_shard_464.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.77.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "99c3af8be2da0d91803fd539d0219f35"
+ },
+ {
+ "dataPath": "params_shard_465.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "125ca1f13ae67a151c6bf8c401524f2c"
+ },
+ {
+ "dataPath": "params_shard_466.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3eda4b34fc1685930925fdbd4d965de3"
+ },
+ {
+ "dataPath": "params_shard_467.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "206d7806862e19e0e7233c393e030615"
+ },
+ {
+ "dataPath": "params_shard_468.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.76.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.76.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.77.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.77.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "b8e1937be61c1aa0186e4d6899f920b6"
+ },
+ {
+ "dataPath": "params_shard_469.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.78.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fa1401a75b7d9026574cee2a835346f5"
+ },
+ {
+ "dataPath": "params_shard_470.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.78.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "90b054629563d4ac9413d864a640bcf1"
+ },
+ {
+ "dataPath": "params_shard_471.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "413700dae0cbe4bbcf612907bfad3095"
+ },
+ {
+ "dataPath": "params_shard_472.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1a78366683615c50791f90c53eb448d3"
+ },
+ {
+ "dataPath": "params_shard_473.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ccc664e9ce8c644439849f2de8f98015"
+ },
+ {
+ "dataPath": "params_shard_474.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.77.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.77.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.78.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.78.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "dabd93d7ba32d09c4ae8bb2ad1ca4b7f"
+ },
+ {
+ "dataPath": "params_shard_475.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.79.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e45f9a271bf1c96b5eaf6b13d503f3d7"
+ },
+ {
+ "dataPath": "params_shard_476.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.79.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0a01fd6615c225eb55791bef63990e92"
+ },
+ {
+ "dataPath": "params_shard_477.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "baf19b48fa97bd7f282a0563a9d754e1"
+ },
+ {
+ "dataPath": "params_shard_478.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "980a76eac98b438eaeb9fe04903d37db"
+ },
+ {
+ "dataPath": "params_shard_479.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "26c189280f5b1594caae139a3c2c7b54"
+ },
+ {
+ "dataPath": "params_shard_480.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.78.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.78.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.79.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.79.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c059f9ebdf234dbb1630b8f4f271e633"
+ },
+ {
+ "dataPath": "params_shard_481.bin",
+ "format": "raw-shard",
+ "nbytes": 525336576,
+ "records": [
+ {
+ "name": "lm_head.q_weight",
+ "shape": [
+ 128256,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 525336576,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "730787cac5ba05aea86d7cb9a73cc13c"
+ },
+ {
+ "dataPath": "params_shard_482.bin",
+ "format": "raw-shard",
+ "nbytes": 65667072,
+ "records": [
+ {
+ "name": "lm_head.q_scale",
+ "shape": [
+ 128256,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 65667072,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "49eb95dcae5fdec4009c154ea486cd4b"
+ },
+ {
+ "dataPath": "params_shard_483.bin",
+ "format": "raw-shard",
+ "nbytes": 14729216,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.79.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.79.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.norm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float16",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14712832
+ }
+ ],
+ "md5sum": "4bc634d100b8d489d80dacab3038d990"
+ }
+ ]
+}
\ No newline at end of file
diff --git a/params_shard_0.bin b/params_shard_0.bin
new file mode 100644
index 0000000000000000000000000000000000000000..686a2a66a952d99090dc5d8d1002e7e4bf663c78
--- /dev/null
+++ b/params_shard_0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1f24c9fbbc6920629c876855111b3766a293cc06671d8145f1494147be5a61b7
+size 525336576
diff --git a/params_shard_1.bin b/params_shard_1.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d2acd7dbc967b622eb44ff70cdad0a5e28533902
--- /dev/null
+++ b/params_shard_1.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e9c8c24bf301c2d62a32504830c5349c1e3d97ac56e3986a8b8a3a2087be0ec2
+size 65667072
diff --git a/params_shard_10.bin b/params_shard_10.bin
new file mode 100644
index 0000000000000000000000000000000000000000..07328507cd024888ac280498c5f266cd809bc4c1
--- /dev/null
+++ b/params_shard_10.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6f37f62d1681a0360569fb0356563d5ae7c18d32fe04945f1471eb16045f61e0
+size 234881024
diff --git a/params_shard_100.bin b/params_shard_100.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa1dd6f3f83f73bf0e4a383250dc0dccb5bb1dd4
--- /dev/null
+++ b/params_shard_100.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8930ef36f34b354449faecfae6cf58da29644ccaf1cf7569c1126675e65f7e63
+size 29360128
diff --git a/params_shard_101.bin b/params_shard_101.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0d2484faecaae3a809e469ba4aa78c4e1566b4cd
--- /dev/null
+++ b/params_shard_101.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:86b716c9985ff4b88ca7bd03ea871e4f63bfc36e95c66138f02c5298073b0bc9
+size 117440512
diff --git a/params_shard_102.bin b/params_shard_102.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4239c478db3ff2b4b127df502f87f67ae9557608
--- /dev/null
+++ b/params_shard_102.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d3d58693fb30ead9dc1cbaa166abf944c38cd55bf54b9d9b94a356351421458
+size 24150016
diff --git a/params_shard_103.bin b/params_shard_103.bin
new file mode 100644
index 0000000000000000000000000000000000000000..956764de2e817bf91d8d68a2d479ef2a25393154
--- /dev/null
+++ b/params_shard_103.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e1bea1a555358ec5fb81abe629dda7cae790b0be71a3b982339cd5fd0e9aff5
+size 41943040
diff --git a/params_shard_104.bin b/params_shard_104.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a3395e7c51efba6af156ba72c3c86f71502a65d4
--- /dev/null
+++ b/params_shard_104.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8b172436280ae8389ca8c9ebb9bd2daae07d2fabf4b320dc886efbc23d7908fc
+size 33554432
diff --git a/params_shard_105.bin b/params_shard_105.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36690ed727826343109f4cac3dc6d8947716e8a8
--- /dev/null
+++ b/params_shard_105.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d7bfa18718992f33b90bc777c8feaf616f9d6ffde01b9f4392fd8c4a47cf0d9f
+size 234881024
diff --git a/params_shard_106.bin b/params_shard_106.bin
new file mode 100644
index 0000000000000000000000000000000000000000..31b9addd555b75de9a927f1a111dcf0fe471c6f8
--- /dev/null
+++ b/params_shard_106.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0a6bc0f4938131106297dd0014883bfac09fbe7c85364f7510bbf2f23a7ad97b
+size 29360128
diff --git a/params_shard_107.bin b/params_shard_107.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d4b7c257fc968ebd6b4596204928e23b532a7244
--- /dev/null
+++ b/params_shard_107.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c5111a7e11043155deecd995410b33d7a66a437f2f93a98b203cebc26e098d00
+size 117440512
diff --git a/params_shard_108.bin b/params_shard_108.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3c11bcb4ad5cfa99bc240468aabda81a8ca2846e
--- /dev/null
+++ b/params_shard_108.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:77c84ef32d5e8eac0935e5d4b2e58b38855a64a762d2205b445b2cc2c5c2dbc1
+size 24150016
diff --git a/params_shard_109.bin b/params_shard_109.bin
new file mode 100644
index 0000000000000000000000000000000000000000..85f3237d63528c5dd92789028f4daeaebffc20b7
--- /dev/null
+++ b/params_shard_109.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2d21a468c7f6569317476f9d924300dcb24b85e8409bc2a14b2c6a4e34a0375a
+size 41943040
diff --git a/params_shard_11.bin b/params_shard_11.bin
new file mode 100644
index 0000000000000000000000000000000000000000..938cfe2aa37cf21561b66b1ffd39977ee4895fbf
--- /dev/null
+++ b/params_shard_11.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3f8bf44967d621638f96b9de3ecccc44acd46e44ed64339478777972e0908cff
+size 29360128
diff --git a/params_shard_110.bin b/params_shard_110.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6992a833b2679938489a99dc1ca7739df6d5ccf9
--- /dev/null
+++ b/params_shard_110.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d4b63b8669bd9af949400e445b97ec346d245a70caad68e55eeca80e9c3249c
+size 33554432
diff --git a/params_shard_111.bin b/params_shard_111.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8b48a94cf06d4da6b2554d1c169cca292a163e53
--- /dev/null
+++ b/params_shard_111.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:086f3976daac47f7a5c921c1e8ab663379f9dab07cbdd4a3fc3b8c502b9bad57
+size 234881024
diff --git a/params_shard_112.bin b/params_shard_112.bin
new file mode 100644
index 0000000000000000000000000000000000000000..360c2ec5dcdd516ef7c835c6674ee304342b0af0
--- /dev/null
+++ b/params_shard_112.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:25df3d30007e472f000b834eb08c4e586c1f92da7d66b3d27ea334110e11d463
+size 29360128
diff --git a/params_shard_113.bin b/params_shard_113.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b4ca392bc180a8ce1ab376cf0602e61cdcb5f318
--- /dev/null
+++ b/params_shard_113.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a575b41f389e9f36309eee57d552145b8a7646e353726f4306311d4f12199bbe
+size 117440512
diff --git a/params_shard_114.bin b/params_shard_114.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5b4dbd93bfd20d609fa50baf987b10edb01d8f7e
--- /dev/null
+++ b/params_shard_114.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6557f1f1ed51bcac1cab52b1f4628d23e5683c5b3bda13152a3ead429a50d332
+size 24150016
diff --git a/params_shard_115.bin b/params_shard_115.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4014749b8f50048ea0c9a32552682758ed1959ac
--- /dev/null
+++ b/params_shard_115.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9f241066b7238a36d5303cf8c9fd772d4e28e2e2bb132069eb70127b6b571368
+size 41943040
diff --git a/params_shard_116.bin b/params_shard_116.bin
new file mode 100644
index 0000000000000000000000000000000000000000..68f3913dbdf14efeeebf13c369a3b928d9bfd63f
--- /dev/null
+++ b/params_shard_116.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c5c590ca2aee560a781875c48bd6b48db4ca6e92a681d1f2f82aef22fd3ce440
+size 33554432
diff --git a/params_shard_117.bin b/params_shard_117.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6cd552dfc110d659604e4c5e0c30a0b6fc541783
--- /dev/null
+++ b/params_shard_117.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dbe8ba31d7e2a19be6b2e23147024864216f2602352149b887583e661729146d
+size 234881024
diff --git a/params_shard_118.bin b/params_shard_118.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d8db1b8aa12a65dd64918f2169f2f6ce79768f9f
--- /dev/null
+++ b/params_shard_118.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b963576b1387bc1c6b5fdb4f70912892ac8a4c0ba03c4510b7d3a20cd03eab51
+size 29360128
diff --git a/params_shard_119.bin b/params_shard_119.bin
new file mode 100644
index 0000000000000000000000000000000000000000..878c5ed45626016d10d89520c2c123d1a729fb1b
--- /dev/null
+++ b/params_shard_119.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:543f55987600991106d03bd66fea20e1428a0e4c681cedd27ed954845ecb8f19
+size 117440512
diff --git a/params_shard_12.bin b/params_shard_12.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e493f57edda5ef7ed330490183ffc20b88613d2c
--- /dev/null
+++ b/params_shard_12.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:66808c7061150f58165ac7dd2dfda33aa5e07dbdc27020329c61d938061dc38e
+size 117440512
diff --git a/params_shard_120.bin b/params_shard_120.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d8ef914080abc0830ce6d5728305de81edf37578
--- /dev/null
+++ b/params_shard_120.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e7edec0c4e3fd748b93404d895106e55870a179d45647b4ea9084c2def049559
+size 24150016
diff --git a/params_shard_121.bin b/params_shard_121.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2d1b5b2cedce4d76256bf7b04582740496e1d4e1
--- /dev/null
+++ b/params_shard_121.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfa9bf3e125ac8332e2e041d61fee289cb4484e7ddb2ff03fc77b80a5ed55a4c
+size 41943040
diff --git a/params_shard_122.bin b/params_shard_122.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1eaf4f5389415105905efbe235c2850760b0a930
--- /dev/null
+++ b/params_shard_122.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e9575ab3ca1dd7e46de8129f3955d168fab0686814d086c23448d45150b78c1c
+size 33554432
diff --git a/params_shard_123.bin b/params_shard_123.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3aaa7eb52abd5eb2e58c7e811fd45015def07122
--- /dev/null
+++ b/params_shard_123.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0dec7c452370c7ac81844e1c93d4e0ce0bb727c9d85b99d0c66f4aaac80efc6d
+size 234881024
diff --git a/params_shard_124.bin b/params_shard_124.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8cb7fc9850b5c4e347b0e70a2ca448393b787b8d
--- /dev/null
+++ b/params_shard_124.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6a789adff8d273f87d671ffb839ee14534af5a5600a6d53137c2768ecbcf6238
+size 29360128
diff --git a/params_shard_125.bin b/params_shard_125.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f21ec150f1fc347a1d3ed544cacd625cc95d45ff
--- /dev/null
+++ b/params_shard_125.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:94ca3545d9f7f1a619ed2582e09d4303e2e459d48f9826d12b701c9c52abb8a7
+size 117440512
diff --git a/params_shard_126.bin b/params_shard_126.bin
new file mode 100644
index 0000000000000000000000000000000000000000..604594528a6607e769e643ae9f58a0a6f2f1d251
--- /dev/null
+++ b/params_shard_126.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1799d3c2c53d6951e36082446b44834acbb82f20a5db8583de4ac13cb414e6a5
+size 24150016
diff --git a/params_shard_127.bin b/params_shard_127.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0db24566c3464330ada280e20b2454e5ece213c6
--- /dev/null
+++ b/params_shard_127.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:103a668018b91208ff4e20f51c7f034ed429158621877958a661c657fa69f007
+size 41943040
diff --git a/params_shard_128.bin b/params_shard_128.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b983438c33971e836bf948e42a293f17f552b67a
--- /dev/null
+++ b/params_shard_128.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:364e2ad330c0e9af06ed9c5e2fbf279152b11065fa345361baae09b6f5e06933
+size 33554432
diff --git a/params_shard_129.bin b/params_shard_129.bin
new file mode 100644
index 0000000000000000000000000000000000000000..50c0840d23ae1e05487cdf2218dd565931546332
--- /dev/null
+++ b/params_shard_129.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:07be00ac56dd1a3fb8980c948bd770c5cbd8bec49f219352fa2dd0463c9ff92c
+size 234881024
diff --git a/params_shard_13.bin b/params_shard_13.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f7b9907b1ff3f85aa58923818cb3e7b5bd1762d6
--- /dev/null
+++ b/params_shard_13.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:42baad1d9134c150d311cf4003a61b401cfc7a93a55aaf35d96e1313605c0539
+size 41943040
diff --git a/params_shard_130.bin b/params_shard_130.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1df004286471250cb0968ad1da7103d0d5921063
--- /dev/null
+++ b/params_shard_130.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a2d7dd08205c4bbbadae1d34da1cca55e0ca3644f9fba73fd48119c5e78e09fc
+size 29360128
diff --git a/params_shard_131.bin b/params_shard_131.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e3f5d87017ad1d7b6112739d5470310621daa605
--- /dev/null
+++ b/params_shard_131.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bd3ce093595cdf6c5f8f5067429bf124552dc624cf9131af38122c67787a60d9
+size 117440512
diff --git a/params_shard_132.bin b/params_shard_132.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ae57516fb6f92dd0bc7a67e0917de4ceb023f3d2
--- /dev/null
+++ b/params_shard_132.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9b9fe5dcbce1ffee2f746042c4b7e05d4a8200240fa702a2e88ed766856fbd94
+size 24150016
diff --git a/params_shard_133.bin b/params_shard_133.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b310f46052d693674345ab7aaf009aaeb955d4a5
--- /dev/null
+++ b/params_shard_133.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3ee5c86049ae401baf1e0f63e566de3a4fefe890ae71d109f8af2b11a45ab5d0
+size 41943040
diff --git a/params_shard_134.bin b/params_shard_134.bin
new file mode 100644
index 0000000000000000000000000000000000000000..234a3916e6f405a796230b0dafa0148211399cee
--- /dev/null
+++ b/params_shard_134.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d045f90737fe2aa114ca0e5226ea1038a0464693478ced0e382ece85ef42e32c
+size 33554432
diff --git a/params_shard_135.bin b/params_shard_135.bin
new file mode 100644
index 0000000000000000000000000000000000000000..12cbee9284ec60b55a7df86f715f68c2e42533b9
--- /dev/null
+++ b/params_shard_135.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:432646db728dc8cc411a12cc223e70f497810c569c3e9889c82ba1be2e12817b
+size 234881024
diff --git a/params_shard_136.bin b/params_shard_136.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2a297e65638a2856f8caa8adb12253da4370c543
--- /dev/null
+++ b/params_shard_136.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:73ac714308cfd9b24499ac1b12d9f1e5779881397ffc8c8525810eb31015a9d5
+size 29360128
diff --git a/params_shard_137.bin b/params_shard_137.bin
new file mode 100644
index 0000000000000000000000000000000000000000..faf65fc9f47516a27c122805a3a5a5e48ca13ba2
--- /dev/null
+++ b/params_shard_137.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:90e47b91094f9342e6716378794c232c19bb6a6cd1fed0e777760bc675dc201a
+size 117440512
diff --git a/params_shard_138.bin b/params_shard_138.bin
new file mode 100644
index 0000000000000000000000000000000000000000..577b1b97e681d2e7520730e97bce5c16e9655b7e
--- /dev/null
+++ b/params_shard_138.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38217d06ff42696fac96006b061a676ac1231900fbf64a32751ae83c92b020af
+size 24150016
diff --git a/params_shard_139.bin b/params_shard_139.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b7e90992939e457d783be0ab6ee6a52186f0b43a
--- /dev/null
+++ b/params_shard_139.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4a41511014e9e25e810edcf6bde878f07cad3818120236454854abaf4205800c
+size 41943040
diff --git a/params_shard_14.bin b/params_shard_14.bin
new file mode 100644
index 0000000000000000000000000000000000000000..35d2dd0a7e1e9e391055cd0ea6f14c4db938b104
--- /dev/null
+++ b/params_shard_14.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c67885fe3300a3b81cc614189327203e11bea3eea97055f10ccfa1e56953d47c
+size 33554432
diff --git a/params_shard_140.bin b/params_shard_140.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8bce0188a25c50fba8d7684ce3178f18a3ccea31
--- /dev/null
+++ b/params_shard_140.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b8a2f8ecbf2dbd8edb758939e021917a5f9817cda556034f5d85f5c57c8e654a
+size 33554432
diff --git a/params_shard_141.bin b/params_shard_141.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ac710f4911b1703b548337a697f83f71f161c53
--- /dev/null
+++ b/params_shard_141.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4993c55f8ae14f77623b43adc336e3a69833c2046740fe1e83eede143aed5976
+size 234881024
diff --git a/params_shard_142.bin b/params_shard_142.bin
new file mode 100644
index 0000000000000000000000000000000000000000..32bfaded5c7bf1cf7433dce1f813e2d2ee40a7ca
--- /dev/null
+++ b/params_shard_142.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b5d4f91cf8c8f59b0b101c9997b04d3fc317c4b320200aec8409670eb9b716a1
+size 29360128
diff --git a/params_shard_143.bin b/params_shard_143.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4f90295b71e1a439c073010727a02e96ef0822e0
--- /dev/null
+++ b/params_shard_143.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:14f6426c19c46527601310bb1535585fb99c789d6a5a4215ca8071bcc2feae2c
+size 117440512
diff --git a/params_shard_144.bin b/params_shard_144.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d1d4a8843fcc16752b95c90ab3e26f2ad0b750b5
--- /dev/null
+++ b/params_shard_144.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6707bb1d5c523853eada9983bd4e3b0f36f91dd93acd1e2563bc93c601018933
+size 24150016
diff --git a/params_shard_145.bin b/params_shard_145.bin
new file mode 100644
index 0000000000000000000000000000000000000000..68e3103fdcf185debc73bcb0ce0f71476f07ec77
--- /dev/null
+++ b/params_shard_145.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:79b35ba9cc0026c5307aad5661b92faccb3a04a4d86eaba4e0fab3bac57b4245
+size 41943040
diff --git a/params_shard_146.bin b/params_shard_146.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e4dac4cbebe5fd16d926121b3a74a287b1b1d23f
--- /dev/null
+++ b/params_shard_146.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:23c4c54c4a679b7f1dee0603e10559d6ac4d438dd037aa8e2c960efc1bbfdf2e
+size 33554432
diff --git a/params_shard_147.bin b/params_shard_147.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5e65cd67d66afb43d87166da868e083c002e5138
--- /dev/null
+++ b/params_shard_147.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ea94e2b9ef19d4b78dd290bff93a0db66fa6bc44d2d430a9c714ac62f775a7c
+size 234881024
diff --git a/params_shard_148.bin b/params_shard_148.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa5f1e67b671940df890db65346eb59a339c18b4
--- /dev/null
+++ b/params_shard_148.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:23fd8e46f2a7c3698b27e156965adba436af68dac8c80bbeec86ea1aab25692c
+size 29360128
diff --git a/params_shard_149.bin b/params_shard_149.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b6659a41e18544171a04635683a5890e386895f9
--- /dev/null
+++ b/params_shard_149.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bb430efe77e617890b265bbb3674fce2de67012c07cb08d4a5ab6f79d6857637
+size 117440512
diff --git a/params_shard_15.bin b/params_shard_15.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d76a73a7de94ccd637f8d11ae1d4e34ae6dbb20b
--- /dev/null
+++ b/params_shard_15.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:047551d6f3c326e03bd179241b0f8a81ea3af7d6ea44b03f8751e92c1f599d3f
+size 234881024
diff --git a/params_shard_150.bin b/params_shard_150.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8826ebd7f3db01eb8ea9fa76767751c70edae35f
--- /dev/null
+++ b/params_shard_150.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:40a3b2d8e54c0591de0ddc2547e86c596bb67382c4099aa3331cf799f0910ef4
+size 24150016
diff --git a/params_shard_151.bin b/params_shard_151.bin
new file mode 100644
index 0000000000000000000000000000000000000000..992906b187e26ebf04c5869357c7741eb90c3de9
--- /dev/null
+++ b/params_shard_151.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dcfbff13a5f1e02fe1bccdf7f1b4aa651dcaaf64e64143029483655acec06ae8
+size 41943040
diff --git a/params_shard_152.bin b/params_shard_152.bin
new file mode 100644
index 0000000000000000000000000000000000000000..07a654f7f71ad6529e98d51917223af8d57b6945
--- /dev/null
+++ b/params_shard_152.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1dcacab39440fcdb7d04471a5aad1b72ef985b0f6cac2b8377022a7e3d921fdb
+size 33554432
diff --git a/params_shard_153.bin b/params_shard_153.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cfed1881388bcdb9b38bb85259a5365c45bf387f
--- /dev/null
+++ b/params_shard_153.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f3b0e28e0e37332231751e899776d19690cada8a53645f5dc3dc7df4bf7c4d98
+size 234881024
diff --git a/params_shard_154.bin b/params_shard_154.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36ca37956cc55c2a8cabd05b1a2b0f78d41f6f74
--- /dev/null
+++ b/params_shard_154.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fcf14271c7eb27d714b211511a86f09e88547febf98c574e525a0422b0c43540
+size 29360128
diff --git a/params_shard_155.bin b/params_shard_155.bin
new file mode 100644
index 0000000000000000000000000000000000000000..260ffce858a3f870196c2b6b80f499ffc9431074
--- /dev/null
+++ b/params_shard_155.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df12d927fe9ff3b0e4a807f46cb402803da9007f9018511dfda83eb67cc9b852
+size 117440512
diff --git a/params_shard_156.bin b/params_shard_156.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ecd4fd4145ee27ae02e8be48d989efdec0ddaa37
--- /dev/null
+++ b/params_shard_156.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7c061ba823f678c63f393461547f39c8580928932f9d56e9be7a9e1a49ace176
+size 24150016
diff --git a/params_shard_157.bin b/params_shard_157.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bb3c1c998fda42b14b5e06588d31dd6f9db97d4b
--- /dev/null
+++ b/params_shard_157.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af1a95d4ae5e56c08f2e98f504f496f30fe04886ba1c97061cc52c3e0a07c020
+size 41943040
diff --git a/params_shard_158.bin b/params_shard_158.bin
new file mode 100644
index 0000000000000000000000000000000000000000..602cb32f575428213b600da8505ed3e5cf84c96e
--- /dev/null
+++ b/params_shard_158.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:56a0b6c5a39d05d0cba3e189b8d34abbcfd00ee75d22334b29313517e0cfa4d2
+size 33554432
diff --git a/params_shard_159.bin b/params_shard_159.bin
new file mode 100644
index 0000000000000000000000000000000000000000..093d19cec85dbf2778a1e1e45eaf59366c494a09
--- /dev/null
+++ b/params_shard_159.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f475258b7662efdc4faba0bea7150e17de1d9d63b6a01c1e70b55c3362334a9
+size 234881024
diff --git a/params_shard_16.bin b/params_shard_16.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36f50bde7d20c053c3b58bc53d11c95b0df99459
--- /dev/null
+++ b/params_shard_16.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2ca599e746acf005922d79254f8d9ac3d56d10db59f7fee90e8f0e47f3da574e
+size 29360128
diff --git a/params_shard_160.bin b/params_shard_160.bin
new file mode 100644
index 0000000000000000000000000000000000000000..27dba655433f4e63847699341a007d3f4e11eb53
--- /dev/null
+++ b/params_shard_160.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a0aaafeb3c56be7601c7b1482251b4d1d8e47d6cca781e3fd23e3d799b8c2c5a
+size 29360128
diff --git a/params_shard_161.bin b/params_shard_161.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0067aeb304683a303a3e4f685d678c33bc114652
--- /dev/null
+++ b/params_shard_161.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:455773c6c456bf615ba6bcdc9358e130d44e03049907aa2f55788b094ad9a950
+size 117440512
diff --git a/params_shard_162.bin b/params_shard_162.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a0f01ebfb800b75a625d665348dd95a0962d65df
--- /dev/null
+++ b/params_shard_162.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4330d874df1dfcb0e2a0dbb397823d30ed285b26f85fea59f05a1ec983f6b514
+size 24150016
diff --git a/params_shard_163.bin b/params_shard_163.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0b031305befe66f4018cb09653f83bf2c4834fab
--- /dev/null
+++ b/params_shard_163.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5799ba156895f0d5f7e6c87ed5ed3255943d03b89a8d6b92cfcc88941def92c8
+size 41943040
diff --git a/params_shard_164.bin b/params_shard_164.bin
new file mode 100644
index 0000000000000000000000000000000000000000..62f6770ea990fed5d5e526d8a9d4dcc208e00ccf
--- /dev/null
+++ b/params_shard_164.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d355d506200cfd4d1d3a63294717f4dcadf50d838ca0fcc2b4ce4c2bbc76d346
+size 33554432
diff --git a/params_shard_165.bin b/params_shard_165.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7500e4d88eccec38c369cf1e2a4a218ce09b71b4
--- /dev/null
+++ b/params_shard_165.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62a8c3f540fb1cb3ed1bf40ebc2d5139c1cf29a361e41fb500b082933b335405
+size 234881024
diff --git a/params_shard_166.bin b/params_shard_166.bin
new file mode 100644
index 0000000000000000000000000000000000000000..98a2c72410ee815198b313c0e6bf3e67de98807f
--- /dev/null
+++ b/params_shard_166.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:738b12d6acf493ed0ac290a2e917c2920e5ab278314c480ca5721097335eaba5
+size 29360128
diff --git a/params_shard_167.bin b/params_shard_167.bin
new file mode 100644
index 0000000000000000000000000000000000000000..19b3645c42b500b828ae9d2b8742ffeaaab476c5
--- /dev/null
+++ b/params_shard_167.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:11e184a4e0a531d7066d8d2384a14005276aaf3f7a9dcb0b8066c03f37709828
+size 117440512
diff --git a/params_shard_168.bin b/params_shard_168.bin
new file mode 100644
index 0000000000000000000000000000000000000000..da872600d97f9a8410df1a92d1d39e8951dee3b3
--- /dev/null
+++ b/params_shard_168.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b1281505a62e9c678a0a76c4b5a2334e36e19a9c19de555c5b316796af09fb8a
+size 24150016
diff --git a/params_shard_169.bin b/params_shard_169.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9fe34a883add4c078e22f0360b4409ab94993d73
--- /dev/null
+++ b/params_shard_169.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dcf15aea724f9161e7579a91acd15cc82ee5780716211d2dce07998842449de5
+size 41943040
diff --git a/params_shard_17.bin b/params_shard_17.bin
new file mode 100644
index 0000000000000000000000000000000000000000..495b2b4a0306b2345650ff23094989c224046f01
--- /dev/null
+++ b/params_shard_17.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:155f2879c5797b2b61269fcb78824551caca64ec7d46dacd54d0d356102b6b8e
+size 117440512
diff --git a/params_shard_170.bin b/params_shard_170.bin
new file mode 100644
index 0000000000000000000000000000000000000000..426601230f4d7e7619e95994b7147605c8cde800
--- /dev/null
+++ b/params_shard_170.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9b8491f60c215846015d9f4bf697d49d8708a1fc4c52c0b33849b8fbd2df065e
+size 33554432
diff --git a/params_shard_171.bin b/params_shard_171.bin
new file mode 100644
index 0000000000000000000000000000000000000000..71fbf5fe672a40752efa82cb35466140e12e8510
--- /dev/null
+++ b/params_shard_171.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2c9c555a4662752177f80b2eb8189719071804f5d58f99f03353ae374ddb7cb4
+size 234881024
diff --git a/params_shard_172.bin b/params_shard_172.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c765938037f22d70f038b4183783258e6a93671a
--- /dev/null
+++ b/params_shard_172.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e5deca3d801f4e54cd70d2d6bdc3cbb0fd2e340833ffc1ec69e90e0cec4eca34
+size 29360128
diff --git a/params_shard_173.bin b/params_shard_173.bin
new file mode 100644
index 0000000000000000000000000000000000000000..503d8d852d09ddcf80dfe0c7f665db9a6d96bcf5
--- /dev/null
+++ b/params_shard_173.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:789644edc68cbc2c993645494a8582ae88814c17269f6b443a4233798bde13ff
+size 117440512
diff --git a/params_shard_174.bin b/params_shard_174.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3cbcbb6e7c98d94b3668c38d140b6e5b7ad1320f
--- /dev/null
+++ b/params_shard_174.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:58e6090d209a809cdfb96355db9058fb240a96f1b3685b9becf0f715adc86dc4
+size 24150016
diff --git a/params_shard_175.bin b/params_shard_175.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3fcd5e350740df97ad6d6b724546fa2272f603f0
--- /dev/null
+++ b/params_shard_175.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2026afe8ef418efddb0355f601d810448b4c49f1a9c7d259a99dd928712aecdf
+size 41943040
diff --git a/params_shard_176.bin b/params_shard_176.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c4f4c088a75bc9e19b67bb8ff9f63fc2a363e7b0
--- /dev/null
+++ b/params_shard_176.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a40c93e212c202970cb63c316c18f871d5c0bffe7007132058cffd08e430ef5
+size 33554432
diff --git a/params_shard_177.bin b/params_shard_177.bin
new file mode 100644
index 0000000000000000000000000000000000000000..977a03c313f6c86246859596118bfe45a399d1c0
--- /dev/null
+++ b/params_shard_177.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7520651d416b077b4a84c0acff65004db69f2f3496f995b27e9e42bb0af07e38
+size 234881024
diff --git a/params_shard_178.bin b/params_shard_178.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f02a031af68502dcdbdb73998ea8caf7a3f54945
--- /dev/null
+++ b/params_shard_178.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c9643f6849f43ff60c2567c2100133aceafb5cb88fb13db9f0a5306267a3b98b
+size 29360128
diff --git a/params_shard_179.bin b/params_shard_179.bin
new file mode 100644
index 0000000000000000000000000000000000000000..43583b52e0aaa81d50769741db963fd1885e85b7
--- /dev/null
+++ b/params_shard_179.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69c37996b0b22c1b66e57266fef78970cdd1b7ca12da10f1a49233f1ccb4a7bd
+size 117440512
diff --git a/params_shard_18.bin b/params_shard_18.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5b13ab167bc42c19ad9b2c8b0fc92d8df2b2b0c8
--- /dev/null
+++ b/params_shard_18.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a9d6f994ca64da7c43887535e17ad2d5a3847bd6c4077b02b8dadaf5d6aea19
+size 28344320
diff --git a/params_shard_180.bin b/params_shard_180.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5b862980e9473fa116132d83cc8a5c57b1961843
--- /dev/null
+++ b/params_shard_180.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:530307734bd73fa3011b0d76608a541df0686fdb407dd069dba6a5b3e6847189
+size 24150016
diff --git a/params_shard_181.bin b/params_shard_181.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ae5c147698e3d6f25367b33f80bbb7ebe0673bd2
--- /dev/null
+++ b/params_shard_181.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f9ae9b2751cb7af9bb51677fceb7306260d7d56eccc8bec7d843f0d5d2cb5609
+size 41943040
diff --git a/params_shard_182.bin b/params_shard_182.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e490e19ca2f691d56ca1e4c821ce6f3be69ec5e9
--- /dev/null
+++ b/params_shard_182.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:265e5b50384c5aea28c86c51ad3c422a04047e1aa005f5d02aef941dc2d7dac1
+size 33554432
diff --git a/params_shard_183.bin b/params_shard_183.bin
new file mode 100644
index 0000000000000000000000000000000000000000..684caf357e3f45b5b7c953d979e8a93623f25197
--- /dev/null
+++ b/params_shard_183.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3567414b9a555c07be27499ab32af0bc1f4e44da452082230eb37ad6a306ea8
+size 234881024
diff --git a/params_shard_184.bin b/params_shard_184.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2920793de559786bc61439448ab0acf8cd3d7cf1
--- /dev/null
+++ b/params_shard_184.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7aff9509bfd60eca026e1e97ec843fbbdafdd976b8049f64ec5cbbe3242ce89f
+size 29360128
diff --git a/params_shard_185.bin b/params_shard_185.bin
new file mode 100644
index 0000000000000000000000000000000000000000..10ba889baff6105ac58c2c1d4c8317b7ab793a24
--- /dev/null
+++ b/params_shard_185.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62251364c799508d3fa858d0fb1dc106e6b0f1282acbfa2c79ee22121c42bf33
+size 117440512
diff --git a/params_shard_186.bin b/params_shard_186.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f8ed842fcf87548c38611eb5f29253ba6e7247d9
--- /dev/null
+++ b/params_shard_186.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:470fb6a75362a3c95f14faa04abfc1fcb7ebf8423d1da9c7b3bd1ef6739dfdea
+size 24150016
diff --git a/params_shard_187.bin b/params_shard_187.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b4c59a030dd3d58bb8c3b24231d2878c5e4f82cf
--- /dev/null
+++ b/params_shard_187.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3e4a8ab0b1c57416c6821881ca2d461f339357b315957a97047f2de096003a68
+size 41943040
diff --git a/params_shard_188.bin b/params_shard_188.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e9a7f9c1982bc0e7152b4d4c012aa372839df273
--- /dev/null
+++ b/params_shard_188.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b34deb763d4d100e9dfa2b1d844cebf559614f0e7efa49124211a2893b9141a2
+size 33554432
diff --git a/params_shard_189.bin b/params_shard_189.bin
new file mode 100644
index 0000000000000000000000000000000000000000..263f10144c836df8b639abd6a40427670ccd7b24
--- /dev/null
+++ b/params_shard_189.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e66035ca63c7dcc88f3b810782ae88cde3f072ef61ab47824999de9d6436b1d2
+size 234881024
diff --git a/params_shard_19.bin b/params_shard_19.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c92a9449430f1101f9546a1425d955e10adc7c64
--- /dev/null
+++ b/params_shard_19.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b0158f91e80149216f93a43c3d60ff4d5bf1762a75515db000f7bf9483a77b9
+size 41943040
diff --git a/params_shard_190.bin b/params_shard_190.bin
new file mode 100644
index 0000000000000000000000000000000000000000..67f7f8ac054cb7dadf774fc556214d623af82251
--- /dev/null
+++ b/params_shard_190.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7e7874010afb7fedb23e69db645003ecb91391459e85ff50350af7822763cc66
+size 29360128
diff --git a/params_shard_191.bin b/params_shard_191.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5703b45aae5ff9c88e07ba561e53e4862fb8ce60
--- /dev/null
+++ b/params_shard_191.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ebadf300d26d3a6bd2a24834f6a115e9d7c16b37a2a5b9ba8c356a7ed391700a
+size 117440512
diff --git a/params_shard_192.bin b/params_shard_192.bin
new file mode 100644
index 0000000000000000000000000000000000000000..35da4981236c21a3c98392a90041e4a78bcbb455
--- /dev/null
+++ b/params_shard_192.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:686fec831904d4f59387a1bcd3fad810037a9bc06944d296a176a802d4a56262
+size 24150016
diff --git a/params_shard_193.bin b/params_shard_193.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a8ff19355cf4694e08d62fae61c2360fd0a3d1ad
--- /dev/null
+++ b/params_shard_193.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2f786448ec5358c5d6cfc056c5898192082db79362b52c3cb18e133f2801a10b
+size 41943040
diff --git a/params_shard_194.bin b/params_shard_194.bin
new file mode 100644
index 0000000000000000000000000000000000000000..91d51a33c87c81fafad3bb50dad48d15a3cdee47
--- /dev/null
+++ b/params_shard_194.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cae24b02872c0554c716f57fe5adc589fca5e217b9e23b5deeac27f3e9372478
+size 33554432
diff --git a/params_shard_195.bin b/params_shard_195.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3c02814e2594e901e3cdea0d4aafc918e6a00dfe
--- /dev/null
+++ b/params_shard_195.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2595ccf822031ef180a516ae4cdf09c8304d26f131423e71250aae227f036fa0
+size 234881024
diff --git a/params_shard_196.bin b/params_shard_196.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dc21bc43f41cb33f0e759a862b0aa5add3e63bb3
--- /dev/null
+++ b/params_shard_196.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cd3e9903f1debf7bb1e7a61320ab5ef3241fe2bd09594cfed1085bf12f263691
+size 29360128
diff --git a/params_shard_197.bin b/params_shard_197.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0725f3f491f882a365b0e715dde0e379c3026929
--- /dev/null
+++ b/params_shard_197.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a39cb3ffcd5b76ab9a13358e70d54e88ed2a0167ab135f2be6d621becd5b2b36
+size 117440512
diff --git a/params_shard_198.bin b/params_shard_198.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9a4bdbb4fb6f4b016c3086063afa6f1cbdd3eb15
--- /dev/null
+++ b/params_shard_198.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d6ece906a40a0d72fcd5f299acfb2dcabf8789ff189b36b04b475d0a35b167b
+size 24150016
diff --git a/params_shard_199.bin b/params_shard_199.bin
new file mode 100644
index 0000000000000000000000000000000000000000..283bf6159e7eaf91a35c9ce7600f398a9832da9d
--- /dev/null
+++ b/params_shard_199.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:03e44918f6cdf8495b771f77fad6375051661b81cde0a821803c0b9ab09a6195
+size 41943040
diff --git a/params_shard_2.bin b/params_shard_2.bin
new file mode 100644
index 0000000000000000000000000000000000000000..263aca5fd4582d1c14c4504e1628e684acf41118
--- /dev/null
+++ b/params_shard_2.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab0041eec73afcd75cfe4d41327eeca202f9d021f4a1de7410d503614b20d873
+size 41943040
diff --git a/params_shard_20.bin b/params_shard_20.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3449c9e9cd09aded7bf7db8919629c7ad33c1697
--- /dev/null
+++ b/params_shard_20.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:98ef45cb3dca761e9208470e6b094c600560cb691b660dce0bc98e1c607d788f
+size 33554432
diff --git a/params_shard_200.bin b/params_shard_200.bin
new file mode 100644
index 0000000000000000000000000000000000000000..df6d1c9972981161e713be6018946b2837ceb39d
--- /dev/null
+++ b/params_shard_200.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41ffcbd63c11771d8f7e4cb0ce3c84a5bc5b9481c766bb45b106a466002b3f1d
+size 33554432
diff --git a/params_shard_201.bin b/params_shard_201.bin
new file mode 100644
index 0000000000000000000000000000000000000000..805fc64485ae623a3c8278087858645539739c22
--- /dev/null
+++ b/params_shard_201.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b46a8abe170b330d6b280f6547d3d5e989b720ec3b8555e1cd308e27b1f62b47
+size 234881024
diff --git a/params_shard_202.bin b/params_shard_202.bin
new file mode 100644
index 0000000000000000000000000000000000000000..74610eb6436529244e7c2a1c3bc7c46b6b64b1b1
--- /dev/null
+++ b/params_shard_202.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a1e877771e1dad431cdab1dd649a2f5468720c32b694bcc80f2ed2a04978867c
+size 29360128
diff --git a/params_shard_203.bin b/params_shard_203.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e80e7b124641705685e40a452ea66e438bb1998b
--- /dev/null
+++ b/params_shard_203.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:663eedbe21898493b6a2a19ca5388f360e008be0af45e01f4088ca27d9b268e6
+size 117440512
diff --git a/params_shard_204.bin b/params_shard_204.bin
new file mode 100644
index 0000000000000000000000000000000000000000..27700ca2022a1ae6e053c40b729fa66d04a9efc6
--- /dev/null
+++ b/params_shard_204.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab0270bb84729f8fe7f796c0db787a0d326297f4881d0c8ecc062e7cf8aa2c54
+size 24150016
diff --git a/params_shard_205.bin b/params_shard_205.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d6777857b99ca1bb23a421f0607a20fef6dd5855
--- /dev/null
+++ b/params_shard_205.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:595c34a7b6b939083c1ebbf8449a373549f5b909a799153ea2637f68902cf5be
+size 41943040
diff --git a/params_shard_206.bin b/params_shard_206.bin
new file mode 100644
index 0000000000000000000000000000000000000000..06c5c0e4c6c6bf2abd34d75c197dcbf65ec5ef1c
--- /dev/null
+++ b/params_shard_206.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3939a244cf41310797dd9cb04ef22769a7b9fb167f932adacc5f2f3a0633d861
+size 33554432
diff --git a/params_shard_207.bin b/params_shard_207.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f4551829dad0189a0162667b23ba6cf852b1eb58
--- /dev/null
+++ b/params_shard_207.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ee8f9c4c9eaf6d592923c89cb2ef6ba3cee2a91c5d094492c9fa9f08a7e77367
+size 234881024
diff --git a/params_shard_208.bin b/params_shard_208.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e600e3821c063180802b967db9827366d0bab09d
--- /dev/null
+++ b/params_shard_208.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8966e5db08829480f1eeec5a82aeff4b31d0a88dcd04c21c32a19b332eeb047f
+size 29360128
diff --git a/params_shard_209.bin b/params_shard_209.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b9c697a1c1368dccd86e5adbf72c01b3dd10341c
--- /dev/null
+++ b/params_shard_209.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:83fe406cdb9391129d641281edfbc0d28a4c2c1e4806aeb95a22916ed8e490d4
+size 117440512
diff --git a/params_shard_21.bin b/params_shard_21.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b71a8f53bee929d97a1334f449734912a23193bb
--- /dev/null
+++ b/params_shard_21.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:87948a71f825de125380d6eb890ee62cbea8ebadd5b60c7d5dfdacf95ac1fe5c
+size 234881024
diff --git a/params_shard_210.bin b/params_shard_210.bin
new file mode 100644
index 0000000000000000000000000000000000000000..80a62d23101fb7a9220cdcda3707f3aa58697707
--- /dev/null
+++ b/params_shard_210.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ffc4bb74db3d07033a24cebb27613a0feb5a8c8f7ea668b521014daa28465a0
+size 24150016
diff --git a/params_shard_211.bin b/params_shard_211.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5dd9010406488af04e2ed4d6dd48941336fc58df
--- /dev/null
+++ b/params_shard_211.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6be509dc46b8c4e447cb66e7d44cc150703d2755c10012e5cd06158f4d83eb90
+size 41943040
diff --git a/params_shard_212.bin b/params_shard_212.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aec401afcaa191ee7b989c3f94ec3bfa0e7cb1ba
--- /dev/null
+++ b/params_shard_212.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9a6eaf05ec448272c410618c7075b8b98139ef796a5621a501047de7338390e6
+size 33554432
diff --git a/params_shard_213.bin b/params_shard_213.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c5413bb5827b508a403c24d8180baafa16d89392
--- /dev/null
+++ b/params_shard_213.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:93c6b8bbc8f05687422a00b1d877f108829ba841241b25944ef9dcde3c3fd3e1
+size 234881024
diff --git a/params_shard_214.bin b/params_shard_214.bin
new file mode 100644
index 0000000000000000000000000000000000000000..524a7a2751fb81c49cf13196bb8442630db7a9ae
--- /dev/null
+++ b/params_shard_214.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:82e92cd52453e1501f160849575ecc2e5bca1a16a5088b33916c7c066b3bcf53
+size 29360128
diff --git a/params_shard_215.bin b/params_shard_215.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4db4aba218aeae22cdbea5ffc9bce20242afdaf2
--- /dev/null
+++ b/params_shard_215.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bd786d3e0cd4705f8b480951114c0b0e0c007f91839e09d8b23eeedb086e722
+size 117440512
diff --git a/params_shard_216.bin b/params_shard_216.bin
new file mode 100644
index 0000000000000000000000000000000000000000..981e0cb85e8448bf2f2939fd6cb3f6f5972bd0ba
--- /dev/null
+++ b/params_shard_216.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:077d82bd2f73d9cef24654fadea66d9e37624fb0c3997bfdc510e89995cf39fe
+size 24150016
diff --git a/params_shard_217.bin b/params_shard_217.bin
new file mode 100644
index 0000000000000000000000000000000000000000..092ceaf98b965cf857a15b510b383458c1778e98
--- /dev/null
+++ b/params_shard_217.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4822b52f8f321d3180731ce1bc3ae80a0d5be0f314ab9e61b48aae80a62212f5
+size 41943040
diff --git a/params_shard_218.bin b/params_shard_218.bin
new file mode 100644
index 0000000000000000000000000000000000000000..145fade0ca8a38172a09a6bfd197d21cfcb8c6e7
--- /dev/null
+++ b/params_shard_218.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3db4b5a582ffb1ee72761c9ba52628aaec93ecad25f6dab199f4a4baa95449fb
+size 33554432
diff --git a/params_shard_219.bin b/params_shard_219.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d74e967c4e9031e2f101721e7985034b5780f1e
--- /dev/null
+++ b/params_shard_219.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5a4f3b9f6a8ec0793e6fb17c0a15e838bf3b960c834b680033cb43b2bb28dd4a
+size 234881024
diff --git a/params_shard_22.bin b/params_shard_22.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8b1921a8dd70d93609f2d296932ff31d1492f527
--- /dev/null
+++ b/params_shard_22.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4014681845729e36f2abdcd059aac309b9b4b9af0d28cd21b001e98064223a89
+size 29360128
diff --git a/params_shard_220.bin b/params_shard_220.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8e6c8455b796f8b7b21a6b147f66221e33997fb0
--- /dev/null
+++ b/params_shard_220.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b86360b3aa56dde511ba1a0cfb9b38dd5bad5ed03ff997b38136f73e77f09e5
+size 29360128
diff --git a/params_shard_221.bin b/params_shard_221.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3d007f7ce00413db573fbc0e113c6d4b569d7f05
--- /dev/null
+++ b/params_shard_221.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b82b5c4f3d901ea957e6e7fe75ab4dff411d0686b4b1fa85ac8cf424a4e63935
+size 117440512
diff --git a/params_shard_222.bin b/params_shard_222.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e38645297ed78e48d04e5649c264f31a13dedc62
--- /dev/null
+++ b/params_shard_222.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:45fed886652159e74959661ffe9def530db8aee5a16e2f952ad1ff0562b4b53b
+size 24150016
diff --git a/params_shard_223.bin b/params_shard_223.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c3eee37dc5e66c6b335ef9b4347fd0be0a4e8a5b
--- /dev/null
+++ b/params_shard_223.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:34e8a8f2aa84943a2f5b18077da41ba7807396ced8e1308db60a026efbeecb02
+size 41943040
diff --git a/params_shard_224.bin b/params_shard_224.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4fb8769bcb19d3a1d45d33e0f79679fcd9fefc7e
--- /dev/null
+++ b/params_shard_224.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:facaf7c205e28545b909201a21204dc419bb323118bf0c5d4eefe5392cd87cbd
+size 33554432
diff --git a/params_shard_225.bin b/params_shard_225.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3ba75ad5a834db640ea2f051cb6fd4a6f7951ed8
--- /dev/null
+++ b/params_shard_225.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cdc10902b590d5d90c73a1f23efcc1f0742981404024d51c611184411429488e
+size 234881024
diff --git a/params_shard_226.bin b/params_shard_226.bin
new file mode 100644
index 0000000000000000000000000000000000000000..494bad9595098dd65300c48b889f32ddf3a3aa12
--- /dev/null
+++ b/params_shard_226.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e4c45456d788da48de39c35524a29e0561ab66ae0376cc94dca51ff6fad434ea
+size 29360128
diff --git a/params_shard_227.bin b/params_shard_227.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f501ea8c2f8008e974b420ecaa9d3e96a079f507
--- /dev/null
+++ b/params_shard_227.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:621f190aad8a6409182658848a7f8d91a7e71dc4f74e0c0750a7c9b4ba72ea9d
+size 117440512
diff --git a/params_shard_228.bin b/params_shard_228.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2eafb521d42a590cac596f1537629af006746a94
--- /dev/null
+++ b/params_shard_228.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3f2a7b76bb4e281f151a09bb17a29939ac52a75e94a75432301e67b8815c4a94
+size 24150016
diff --git a/params_shard_229.bin b/params_shard_229.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4fa09fc1c0070adb36f65cac40abd9d833177184
--- /dev/null
+++ b/params_shard_229.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:73c17ba4a35a0fb1982a564d3d746d9b032414b14b6f6804d6faac382c28117d
+size 41943040
diff --git a/params_shard_23.bin b/params_shard_23.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7b9129a354067ca78f6a91711f7426244cb39a05
--- /dev/null
+++ b/params_shard_23.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5367e6ae65f301a020d2724757a2916516ee9ea9b9d877ae82b11235347b6a54
+size 117440512
diff --git a/params_shard_230.bin b/params_shard_230.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4a55ef08f919b824cf7554b464305c3b01522e86
--- /dev/null
+++ b/params_shard_230.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e9e14a2665a8c1ecbf20aca253727c94198e81842f5e9cfc0b4dd5de1b1787d8
+size 33554432
diff --git a/params_shard_231.bin b/params_shard_231.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2b1954e0ee77bcce6ff7385194658782e6bf2329
--- /dev/null
+++ b/params_shard_231.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ff2d44ca2b13ec3f88682021105b3598f984277a843f6f744773a1462567689b
+size 234881024
diff --git a/params_shard_232.bin b/params_shard_232.bin
new file mode 100644
index 0000000000000000000000000000000000000000..43977367b7c490068450c33b5e34c85e630465e7
--- /dev/null
+++ b/params_shard_232.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4e0bf61d1d9b712efd8e8f3a4539126c39206b7fb50f5d79258c0ff1b0364f2a
+size 29360128
diff --git a/params_shard_233.bin b/params_shard_233.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f23de245ded44186e1fd4977aeac3d6489004b2c
--- /dev/null
+++ b/params_shard_233.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b66cb135220da020cb3f82b5fc1226f2f9ed1d2106c3e2e93b9eb0a593a94fac
+size 117440512
diff --git a/params_shard_234.bin b/params_shard_234.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ac006cf16f8954db7bf7aa55e1ba4605f97e8951
--- /dev/null
+++ b/params_shard_234.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d9e4e41fb377a26bd3f6d7ab501f18e635afa738aac9ba2671cd85679cd58435
+size 24150016
diff --git a/params_shard_235.bin b/params_shard_235.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c0154b4e13d9da02bbb178d63e42a6c2f5a4a290
--- /dev/null
+++ b/params_shard_235.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5ddb1f3b288273d9bd94c0d20e3487da83b40bc05d3b0a0c9fe0fca3d5e5c446
+size 41943040
diff --git a/params_shard_236.bin b/params_shard_236.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b50e3e1f91a5e8b5f2c7fac5fae9a1a1add750ce
--- /dev/null
+++ b/params_shard_236.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:646b7b3ebdab7b9d91f19c90ef0adb9260444c736b86d99642128b33d8c58850
+size 33554432
diff --git a/params_shard_237.bin b/params_shard_237.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7e8d8ac89e551aa5b95ed6288c11b772b74220dd
--- /dev/null
+++ b/params_shard_237.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0c33c75d4df9e41aac48bc92f4a94ddd4e6dac7c8ea5398c1cf842a786d22413
+size 234881024
diff --git a/params_shard_238.bin b/params_shard_238.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7b3505aeba9fd9d3ed438fd58167c2e6b783f914
--- /dev/null
+++ b/params_shard_238.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74d5c6fc72345dbf96c6670c1a19904aec35e748fd5985be09744bc038a55836
+size 29360128
diff --git a/params_shard_239.bin b/params_shard_239.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8670d33c0ec848c98aff175514f1a358164d56c9
--- /dev/null
+++ b/params_shard_239.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e993fb45a4724b451397ef9d17865b56e73320919cf630e4032a92e82b65f3cb
+size 117440512
diff --git a/params_shard_24.bin b/params_shard_24.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e085c5da77b07e0a4dfd9ab647f4a4f40c1c1e4c
--- /dev/null
+++ b/params_shard_24.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7456c91d396f44388eb3cc28e2812941926ae59d04a36c08e85788499a407a14
+size 24150016
diff --git a/params_shard_240.bin b/params_shard_240.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7a021189686f5cdd66ee6cf41a80ebe2739b25c7
--- /dev/null
+++ b/params_shard_240.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab225967610fa48ca5934eae9b8d9992dfb3db7aad3de2a49c6c576e4ac1bfbe
+size 24150016
diff --git a/params_shard_241.bin b/params_shard_241.bin
new file mode 100644
index 0000000000000000000000000000000000000000..817bef2cb933d0f9007f049895032da5dffa11f4
--- /dev/null
+++ b/params_shard_241.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:830a42c66bea3ff05a0beecf68bc2701c304aab33c6420fc67bb099aeb8aa3bd
+size 41943040
diff --git a/params_shard_242.bin b/params_shard_242.bin
new file mode 100644
index 0000000000000000000000000000000000000000..57c742344ae5cb5c734f77017c5e53600a326124
--- /dev/null
+++ b/params_shard_242.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:89681714cf6f7fec82ccad16980a0f6782a04adca1e7b40bbf84ebae089e06fd
+size 33554432
diff --git a/params_shard_243.bin b/params_shard_243.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3499a7a682db24a69b58e8f18d49f0d2dea838d5
--- /dev/null
+++ b/params_shard_243.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:04ce4ba516a7dc66e43fff3e159f0ebba130cb70e96cb478f5013e451ffdb6e5
+size 234881024
diff --git a/params_shard_244.bin b/params_shard_244.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6195c7c2241c8032b3c1722674994a393737d238
--- /dev/null
+++ b/params_shard_244.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6a206566cb47b65b2b7e0862a1d0f4a8d594e3b50ea8fb48525b24a5db36af76
+size 29360128
diff --git a/params_shard_245.bin b/params_shard_245.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e4dab8bace77e0f51601e99e49ea05f1397e3156
--- /dev/null
+++ b/params_shard_245.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:92b674f8ebbc4fd7324bb71e58c1e0f32c034274500f2da4ecddcb76e0e6e924
+size 117440512
diff --git a/params_shard_246.bin b/params_shard_246.bin
new file mode 100644
index 0000000000000000000000000000000000000000..72a4ffeecab6f3688ced0a1a6fa10a3a24c09578
--- /dev/null
+++ b/params_shard_246.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ced51739de7df368df650dfa20323dd3e64c158d34418d109b05ee8be15026a4
+size 24150016
diff --git a/params_shard_247.bin b/params_shard_247.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cb958e931f06b91419db6b91ddc503ab88cb3bd8
--- /dev/null
+++ b/params_shard_247.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7fe2ffa00fc24b68f01dee41aa180e1cef854c24f4722bfbfe30862572fce15
+size 41943040
diff --git a/params_shard_248.bin b/params_shard_248.bin
new file mode 100644
index 0000000000000000000000000000000000000000..39ff670434966edeeddac3594e682cbf062b3b38
--- /dev/null
+++ b/params_shard_248.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f9c029219edc5b5cedf6d28a2adce96b3553afffc7b24e72db5a574e070e4c3
+size 33554432
diff --git a/params_shard_249.bin b/params_shard_249.bin
new file mode 100644
index 0000000000000000000000000000000000000000..61f5a7e34055aa3ba39a62f7f519b197ea97a235
--- /dev/null
+++ b/params_shard_249.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0f31277ed709700f2037d30767bfe045ec838037687fc11bc3e12655fe884910
+size 234881024
diff --git a/params_shard_25.bin b/params_shard_25.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ce3c7534b308fc186445adfcc85780414a4dd59
--- /dev/null
+++ b/params_shard_25.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c1b7556519f293b88abaa50bae1fa1bf54d4e427a715223980249e2815d1c4cf
+size 41943040
diff --git a/params_shard_250.bin b/params_shard_250.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9a2ece7da1e8586b640f71b1b9599fc7558660a3
--- /dev/null
+++ b/params_shard_250.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:216dd6469039da202233c0c1c6644a1e60438e47724fa856ca47f0f02b79de5d
+size 29360128
diff --git a/params_shard_251.bin b/params_shard_251.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3265d7df4e57fa10a941ac41ce5aa747408d66ae
--- /dev/null
+++ b/params_shard_251.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:623a1d978a7aa963868a6d7d32cf9a1b5c67e77afdd91270ed84303c773bf0cc
+size 117440512
diff --git a/params_shard_252.bin b/params_shard_252.bin
new file mode 100644
index 0000000000000000000000000000000000000000..149a88511eaeef1ba8e443326fa940210d3acb8d
--- /dev/null
+++ b/params_shard_252.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3e344fce2d7cde70440d961ea9dab95fe1ab60e75f3e5a76e21bb9cd0d135b4
+size 24150016
diff --git a/params_shard_253.bin b/params_shard_253.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d220539116e39362e4157f86e3ba6addb3d5a5b7
--- /dev/null
+++ b/params_shard_253.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b93b5b0fdf4ac87c2082ae2f8e739b286ed0febeed7d6a76a011304dff9797ca
+size 41943040
diff --git a/params_shard_254.bin b/params_shard_254.bin
new file mode 100644
index 0000000000000000000000000000000000000000..80debe5d5acff4b62bc62303d831dec473c11cb9
--- /dev/null
+++ b/params_shard_254.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:68d5da78e6e5f87cbed6f1051a65039fa28face5e47c9d12ec95d4363da82a76
+size 33554432
diff --git a/params_shard_255.bin b/params_shard_255.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d20945b28cdff7bbfcac97b416c30165ddb2b5dd
--- /dev/null
+++ b/params_shard_255.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d8eff6f1a2a829bfe602fab856b17bfa96c259870d69d1363908b15900f32583
+size 234881024
diff --git a/params_shard_256.bin b/params_shard_256.bin
new file mode 100644
index 0000000000000000000000000000000000000000..baeed006cc8ea71e091e52c4f7a61df11b14a11f
--- /dev/null
+++ b/params_shard_256.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:30e48c7dec70b83fea076fcbb8f4aedd7eeca79eba043c3fb87947fbf89cbb31
+size 29360128
diff --git a/params_shard_257.bin b/params_shard_257.bin
new file mode 100644
index 0000000000000000000000000000000000000000..173c5a5d13f7a25f88cfcdca269d4fc9a4c6ef58
--- /dev/null
+++ b/params_shard_257.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fd635833fea09036f758645d534377021fa1f72f443de0344bb99466826e4385
+size 117440512
diff --git a/params_shard_258.bin b/params_shard_258.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0307b3163611705e5b601b9692d2baaf93b82f78
--- /dev/null
+++ b/params_shard_258.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9b9f109dfe184aac9b1974e3db966ea336fb152f1ecf9351de6a5a1a71c18751
+size 24150016
diff --git a/params_shard_259.bin b/params_shard_259.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa9396a988cc8da9791c364fde960c3e345af1b5
--- /dev/null
+++ b/params_shard_259.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0e45e0c5fc2e301d4e4c604ef2cb5047d8b1194330ddbdc2ab482631148e2ebe
+size 41943040
diff --git a/params_shard_26.bin b/params_shard_26.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5a91b64a92dff05d1cb3643258c495c79a83be97
--- /dev/null
+++ b/params_shard_26.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7f1c98b0b39cb74b0c52cacb61c2f50414182c3c6ffe857febdb076605abb1dc
+size 33554432
diff --git a/params_shard_260.bin b/params_shard_260.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1553611401bfffd612be90f032d47aa77d264239
--- /dev/null
+++ b/params_shard_260.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:074c8c93c620ab5ee0924866f65f91a355f1e1e1df27c28896b2f065c8c81fa4
+size 33554432
diff --git a/params_shard_261.bin b/params_shard_261.bin
new file mode 100644
index 0000000000000000000000000000000000000000..566da5a70cfda665cf4c0467a15a6b68aea71d36
--- /dev/null
+++ b/params_shard_261.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:055f2d03d8249d33006d171579f8952883ec1574d139885b4705394e9b45a411
+size 234881024
diff --git a/params_shard_262.bin b/params_shard_262.bin
new file mode 100644
index 0000000000000000000000000000000000000000..622c86701ee9c9947339e4424f2455b654860a99
--- /dev/null
+++ b/params_shard_262.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1069bb2061013e050e0f236c738b9881daa4abbcf26cc291020ce27abece8c76
+size 29360128
diff --git a/params_shard_263.bin b/params_shard_263.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f3271d920fe3da32bd0cc00fc1361412514486e8
--- /dev/null
+++ b/params_shard_263.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ca666c258e64eb4a9cf606e7b33db4e057fee11445a98ebb6054e25e334d75ff
+size 117440512
diff --git a/params_shard_264.bin b/params_shard_264.bin
new file mode 100644
index 0000000000000000000000000000000000000000..26a1ab488f316220a547e9747403dfdeaa96b716
--- /dev/null
+++ b/params_shard_264.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ba01ff1f50aff29287a5e9b70ba397c0b8838ebce97ee5fe0f02341232e13c70
+size 24150016
diff --git a/params_shard_265.bin b/params_shard_265.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dffe1d84d11b86d5dec99c0ec2c62ead9d1a2bcc
--- /dev/null
+++ b/params_shard_265.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b98b1510daffe5ea6130b4cf5dbdb5f71b24f7eb29728b2c46d127d03c7b8643
+size 41943040
diff --git a/params_shard_266.bin b/params_shard_266.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1faf6dd74b5652c810426e12b00d394d327faef3
--- /dev/null
+++ b/params_shard_266.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:261d5298254f9561decef1b6ce4fcfd1da3acc6f61dbd5645e7fa44db9c3df7c
+size 33554432
diff --git a/params_shard_267.bin b/params_shard_267.bin
new file mode 100644
index 0000000000000000000000000000000000000000..95a7740e81af839bdca8128b20f0b1fad34e4d51
--- /dev/null
+++ b/params_shard_267.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8cfbcfea77fa18e255157ca936cfccde476e79301486c577f8726f8683b376f1
+size 234881024
diff --git a/params_shard_268.bin b/params_shard_268.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d2419ef3c6c4c6d0827fae2a5af7c3ba1de4e072
--- /dev/null
+++ b/params_shard_268.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:055d80840d486f815040d440e5d05591ade7707e56d11648e8c56c4b0712755d
+size 29360128
diff --git a/params_shard_269.bin b/params_shard_269.bin
new file mode 100644
index 0000000000000000000000000000000000000000..807b35db34e27b187c9ba1a463f43dcdfc3796a3
--- /dev/null
+++ b/params_shard_269.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:549f3ea448eba0b49c880b00ed1df953aaafa75e5679417be49fb59c5dcbdebe
+size 117440512
diff --git a/params_shard_27.bin b/params_shard_27.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c513488f6ab61c3e3cec6b9677fd7d0f677d6216
--- /dev/null
+++ b/params_shard_27.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0dd8c5e52713f6f7176c4fa9cbb9411371aacf6867c08ebc8bdbc5e23bf7dd7c
+size 234881024
diff --git a/params_shard_270.bin b/params_shard_270.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ec3ded78a699b490ac976183bac56a40deae27b
--- /dev/null
+++ b/params_shard_270.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:18f7f2e1f0de3c47959a517126ec66a4e40e2e4007bef5b4050e7929fd491e4e
+size 24150016
diff --git a/params_shard_271.bin b/params_shard_271.bin
new file mode 100644
index 0000000000000000000000000000000000000000..478d3228596d1a761372bcf5d2fdf495120db868
--- /dev/null
+++ b/params_shard_271.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dc9b9b9f2c6d6f343937ce964a6b74d75bb3e1345e401a3f0fad9168d70edb4d
+size 41943040
diff --git a/params_shard_272.bin b/params_shard_272.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a2acebdc3189f46555489d468829cc493a054660
--- /dev/null
+++ b/params_shard_272.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:24163927b5ccb27405538ebb35d5ab6a06b9b71645335ba56f460aadab51f09b
+size 33554432
diff --git a/params_shard_273.bin b/params_shard_273.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d44a71943659200efa7e58150455e043063e5408
--- /dev/null
+++ b/params_shard_273.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c78c214c49d03937a22352ad945f7280106f1d05184becb2ac655a548a59425
+size 234881024
diff --git a/params_shard_274.bin b/params_shard_274.bin
new file mode 100644
index 0000000000000000000000000000000000000000..897fc189a80805799713cce888846e91e977ea74
--- /dev/null
+++ b/params_shard_274.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ac327516d474d220187cc6b5f76436fff9780925242814ffe7d597b64665870
+size 29360128
diff --git a/params_shard_275.bin b/params_shard_275.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a6d56aa38fc5aef20473d821d574fef9b789320a
--- /dev/null
+++ b/params_shard_275.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1408ec7cda5336e0b473fc7c3028bba8f534bfac58493eda2e3068b096e787a3
+size 117440512
diff --git a/params_shard_276.bin b/params_shard_276.bin
new file mode 100644
index 0000000000000000000000000000000000000000..04787283b108fc13842071017034b04bb54955c8
--- /dev/null
+++ b/params_shard_276.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:217702ed437857dd89713dd075b363f4d2f2acbd56b7c41f4d03df056482faed
+size 24150016
diff --git a/params_shard_277.bin b/params_shard_277.bin
new file mode 100644
index 0000000000000000000000000000000000000000..53fc93226ff34417bf9c7dcd510d5468f7900707
--- /dev/null
+++ b/params_shard_277.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:89a3bf05ab1aefb38c093b7ef38793929e904e62803c114aa6526858a869fe30
+size 41943040
diff --git a/params_shard_278.bin b/params_shard_278.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c8923ce8def6837ad1e9c1bb3f65d0a5463601b3
--- /dev/null
+++ b/params_shard_278.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d2b280f841c405e93600f8f743866e741e7d92677388b3a24d823baadd6dd7a6
+size 33554432
diff --git a/params_shard_279.bin b/params_shard_279.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2e0bf5452fac191bb3f504ec2be46c1363a3aac1
--- /dev/null
+++ b/params_shard_279.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:722b2736585c6befe58c847668d59dfeade00ff80649f05f10683bf284cf6cdd
+size 234881024
diff --git a/params_shard_28.bin b/params_shard_28.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0a825c3651f5a3400214f69cbf5516a1253dadb9
--- /dev/null
+++ b/params_shard_28.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:404099ae00dee0296cdade9df3e251388585b2676cb9e0917205c758e2c64283
+size 29360128
diff --git a/params_shard_280.bin b/params_shard_280.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4a79761db70901d7ac8dbab9da506ebc274599fb
--- /dev/null
+++ b/params_shard_280.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d15c435d62a6bcb882fcfafd117a684eaf2f9134685261b120355d774656f51d
+size 29360128
diff --git a/params_shard_281.bin b/params_shard_281.bin
new file mode 100644
index 0000000000000000000000000000000000000000..77ff78c44d969d71b94be8f3acbdcbf75c875468
--- /dev/null
+++ b/params_shard_281.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:babbb3957a3b8cf28c261b23cddd35b41f86e8b15b0d81ac998d9b08b541ea21
+size 117440512
diff --git a/params_shard_282.bin b/params_shard_282.bin
new file mode 100644
index 0000000000000000000000000000000000000000..00510e2984f18d37a20e19f50b0ee47c916c2d1c
--- /dev/null
+++ b/params_shard_282.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:96aa6b87c29af533fbfd0973c6af9df51051696be92dcfdf1f843aae47f7b2ba
+size 24150016
diff --git a/params_shard_283.bin b/params_shard_283.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fc4f28e420c9a0126635cb8f3fb1340e1364a68e
--- /dev/null
+++ b/params_shard_283.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:922eb40703bcc96de65bad469c9a00a0bd86e50f809dff71d18300954affafb5
+size 41943040
diff --git a/params_shard_284.bin b/params_shard_284.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b4b578cb7b78f663ee7ad975d4358fa6cc0f60d9
--- /dev/null
+++ b/params_shard_284.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:95e27dec93c257d14eadcc6331afca221952485531dcb2455423634a5a79cc72
+size 33554432
diff --git a/params_shard_285.bin b/params_shard_285.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fa0cfcd5fecf3a4a3a5fa44b7b7a689197aa2410
--- /dev/null
+++ b/params_shard_285.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:de7a2396124ab8817fd6a6a63d0f0b857146b1ef0e51327c5e7b306d81cf5602
+size 234881024
diff --git a/params_shard_286.bin b/params_shard_286.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dadd6e2bac3d034087c1cb7c2e23abe88fd6aebb
--- /dev/null
+++ b/params_shard_286.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb6677e451de872b769d076c85d963839a3d182e3963c7bcc1f39e10d9125547
+size 29360128
diff --git a/params_shard_287.bin b/params_shard_287.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f44b3f157ca80903a3a87b56c45b01398be73ef6
--- /dev/null
+++ b/params_shard_287.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:86496c10e76d88fb02ead02901e939524060a9df7dca31e76062b6658f1130a4
+size 117440512
diff --git a/params_shard_288.bin b/params_shard_288.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a5ff79ef8b07b9d1ef6d7f45b6173d1dc6f0c48d
--- /dev/null
+++ b/params_shard_288.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c9494c10bed3993046e8fdb861caac8f023b062d006a3d39921246746a3a5777
+size 24150016
diff --git a/params_shard_289.bin b/params_shard_289.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9fa0c9bfc0b6d4dc025faa62ed603af477f406dc
--- /dev/null
+++ b/params_shard_289.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3afcc3e2e932c9e0834f333747584b320700d26cf451660eeb37385ba7352f4b
+size 41943040
diff --git a/params_shard_29.bin b/params_shard_29.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b136ec3016c6f9fc846ccc153c021cd3030c3bde
--- /dev/null
+++ b/params_shard_29.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b3f3d8cb97c162481ae19f82aee2acf1910cd849fac1e3227c4fa73ce5031bbc
+size 117440512
diff --git a/params_shard_290.bin b/params_shard_290.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a6a528e9859aafa901917938754b902b44db6695
--- /dev/null
+++ b/params_shard_290.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2a2398cf8f4bb11f6c786c9a5f3c4b07ae30dd41f79a3a690d7b14c68a55e364
+size 33554432
diff --git a/params_shard_291.bin b/params_shard_291.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6a8fd0a8aef544b1b111c9071d3bb712f3f37bb7
--- /dev/null
+++ b/params_shard_291.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7bef11ccf5e1a63e0c633e86b5536453775a282d946114e7ac64fa623436923f
+size 234881024
diff --git a/params_shard_292.bin b/params_shard_292.bin
new file mode 100644
index 0000000000000000000000000000000000000000..19d652fb29e8b1db8f5c6ea6abdf72476b12e89c
--- /dev/null
+++ b/params_shard_292.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3f33db1695b1f7ef6a0e344cad359022e2de509432f387044944447787cfbd8d
+size 29360128
diff --git a/params_shard_293.bin b/params_shard_293.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0e3de3222471023804e91945cd7318909d8355fe
--- /dev/null
+++ b/params_shard_293.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ef5a1081cb6ded77b65647eb6d805855e93e99ed0e1e4c88b2864e9da988a5e6
+size 117440512
diff --git a/params_shard_294.bin b/params_shard_294.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dba3e698a147b17b0401f176aa7a02e934ad225d
--- /dev/null
+++ b/params_shard_294.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:04c58e06bce0732628e142a8413b2b9958c75043d04c38185388112e3425c9be
+size 24150016
diff --git a/params_shard_295.bin b/params_shard_295.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2d348252f4654340682a4b4d374c50f6bc466165
--- /dev/null
+++ b/params_shard_295.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6f13bc9a862edb373c05009302bd01654c1dc2b2aa96c5363717d4e31830da85
+size 41943040
diff --git a/params_shard_296.bin b/params_shard_296.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dc60138d2153885c09cefbec646630997686b3a9
--- /dev/null
+++ b/params_shard_296.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bcda1bdb35e625a256924442dd1f89e9ff20f1067abac2d9f2a0c6ffa78dfcbb
+size 33554432
diff --git a/params_shard_297.bin b/params_shard_297.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b1fde810ced590a11c6c4c667e1968a805258882
--- /dev/null
+++ b/params_shard_297.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1388869e533b6810c449439a03ea8fa44b135455df0271a8d9faff0e8899711a
+size 234881024
diff --git a/params_shard_298.bin b/params_shard_298.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e4d2fed33fcbeeb7042929af5d4b1faec39e5a5f
--- /dev/null
+++ b/params_shard_298.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d8420bd4ba5baad6ef337f13671e1bd7d47b96a4148fb7f2404107357a0cf50
+size 29360128
diff --git a/params_shard_299.bin b/params_shard_299.bin
new file mode 100644
index 0000000000000000000000000000000000000000..34f03d541ec3a6ce9aef671dd9958e63eb316e02
--- /dev/null
+++ b/params_shard_299.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e2fca5b266e8db455bf79b46dead8873fe717c1c4e31d58dec47a2dd55a4781
+size 117440512
diff --git a/params_shard_3.bin b/params_shard_3.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fd323153fa87f2ef68c421acabc87604da05712b
--- /dev/null
+++ b/params_shard_3.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c3714c5b6d5db6619f4553c3fcc343b282b56bfc0cac6719dd1b721a37e95a66
+size 33554432
diff --git a/params_shard_30.bin b/params_shard_30.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bb44f049dbca093aa2bbd7528fbccca4369ee8f2
--- /dev/null
+++ b/params_shard_30.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bff679bc274631e23c9c96fb3502f0803e87e927734fff27c911244a0b6a7623
+size 24150016
diff --git a/params_shard_300.bin b/params_shard_300.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a5ea5cdf02803c0d18fe8e72bb9fa78354e7e525
--- /dev/null
+++ b/params_shard_300.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:26f7d5a4a9cfa4ae164612f20b3ed91d7a83f1fd81ddc44e2c9496bee8ef1af1
+size 24150016
diff --git a/params_shard_301.bin b/params_shard_301.bin
new file mode 100644
index 0000000000000000000000000000000000000000..83b76e006a3f69c2c4e88677569be6eadc0ff854
--- /dev/null
+++ b/params_shard_301.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:246196f9837ee3e035d88715af9a5958c0cbf87e2750fdaf61d5b549beead644
+size 41943040
diff --git a/params_shard_302.bin b/params_shard_302.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5dc79f4376ff28c6dd2f6161e571d8003b90b009
--- /dev/null
+++ b/params_shard_302.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e4493d65019f857135df9accfd79b37416b069463d180b23aa6ac141b8f0194f
+size 33554432
diff --git a/params_shard_303.bin b/params_shard_303.bin
new file mode 100644
index 0000000000000000000000000000000000000000..784440b3a9fce7b7711afa773e4380a48a0c662a
--- /dev/null
+++ b/params_shard_303.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4be01759bbfe3d3b909498f7d807c7e6cd115e6c27285d77fe6183d47ece715a
+size 234881024
diff --git a/params_shard_304.bin b/params_shard_304.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c2cd90bc36741f727034bc58cec8fe00a393a010
--- /dev/null
+++ b/params_shard_304.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a34e00cbfa4e59f792f8559fbae72e55b9f6495d5f93adc46769465c360910a1
+size 29360128
diff --git a/params_shard_305.bin b/params_shard_305.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3ccd1cd251e91f64544d7b6d92f1b1df0871fb58
--- /dev/null
+++ b/params_shard_305.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69a10ac6e3578c1fd72e2f95caad2abf727478aafd2fa023f13757f581df3576
+size 117440512
diff --git a/params_shard_306.bin b/params_shard_306.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5d31688bb0aea8026f82004d3be5ba764759d794
--- /dev/null
+++ b/params_shard_306.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ad4aba8139ec01ae241dbe0573fb9128ef4ec0df7b5b4efd4bb03a2ae6d7029e
+size 24150016
diff --git a/params_shard_307.bin b/params_shard_307.bin
new file mode 100644
index 0000000000000000000000000000000000000000..208e64d8313777e87c882d6a934bf7e0b5bf93d1
--- /dev/null
+++ b/params_shard_307.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b423e085b81532b78961110018bc1c6100f79241f93686b7c10b7c0fbda12e4b
+size 41943040
diff --git a/params_shard_308.bin b/params_shard_308.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4887e9c4560005b238eb7d1c030b60e8f63bbe75
--- /dev/null
+++ b/params_shard_308.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4db1ce0df11825a397be9bc5c980c45dcb097e7d6b7747b8fe71c5649259edb9
+size 33554432
diff --git a/params_shard_309.bin b/params_shard_309.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e74ee00828e7b8893a80a8354cca154e75e71572
--- /dev/null
+++ b/params_shard_309.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b259e079ccaff20124b0bb55ccaed9fd359ea9e7a02fc0c000267fa7ccf5b0aa
+size 234881024
diff --git a/params_shard_31.bin b/params_shard_31.bin
new file mode 100644
index 0000000000000000000000000000000000000000..adb57c2adc8011f98a69beda28bd0b06c199c9e0
--- /dev/null
+++ b/params_shard_31.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1fc62a400348b1c1a5de9dc59ca4fa15aa14e8d19e773a82cb9f48958ff43523
+size 41943040
diff --git a/params_shard_310.bin b/params_shard_310.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3c8136fab8ddb87e252f30bc6a04bae0e981b712
--- /dev/null
+++ b/params_shard_310.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:588b5301f2390fd1ea494a11a60c22553a437f6bf871f4a8267c349a3899f0d7
+size 29360128
diff --git a/params_shard_311.bin b/params_shard_311.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c559081634fd80719047c239449f865f24dfce88
--- /dev/null
+++ b/params_shard_311.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c1a0a141d489a280e271cd7c60c36e895c70dd261d8400b2a0278c15ecf836c8
+size 117440512
diff --git a/params_shard_312.bin b/params_shard_312.bin
new file mode 100644
index 0000000000000000000000000000000000000000..564a5da2edff23bc72dea87626062f642d0a137b
--- /dev/null
+++ b/params_shard_312.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fd01c91f331cb79f453f80deb0974e53b810117768feb8c521384cafca8042cc
+size 24150016
diff --git a/params_shard_313.bin b/params_shard_313.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7d600e52e97e9a242522af6ad7fd469b0ed0db1e
--- /dev/null
+++ b/params_shard_313.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e4c97294505c749e8c1d86f3af92f9e43a9d75493a1892c76d9a40256d98df87
+size 41943040
diff --git a/params_shard_314.bin b/params_shard_314.bin
new file mode 100644
index 0000000000000000000000000000000000000000..85739c0d6b0a00e00d6d0c3f72de8ff1b22a9edb
--- /dev/null
+++ b/params_shard_314.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0dfb43da137c9bd5a6284c19fff3e0f91892298775b7518021400d70bb1d284f
+size 33554432
diff --git a/params_shard_315.bin b/params_shard_315.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bc1b1cde9579f3359a517998b29559b0b32b5dc9
--- /dev/null
+++ b/params_shard_315.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f8a4be3c034bd5f84615f969c5f4110ef3b9be817a23c9e82810fe6d90073c5
+size 234881024
diff --git a/params_shard_316.bin b/params_shard_316.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6f3cbd72aa33e406c7f6bae5fb65f4a798f662a9
--- /dev/null
+++ b/params_shard_316.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fec9651f4e23bf5e7bd7732d922a5f019c68856133bdbb1af3c7cf2ad4a55fce
+size 29360128
diff --git a/params_shard_317.bin b/params_shard_317.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9e6fcff34f64a6853973608ec47b90368482f004
--- /dev/null
+++ b/params_shard_317.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:633b69519586c1a0e6478e3302cfa04ec8321d93a6e5f26eb4cb0862b0864973
+size 117440512
diff --git a/params_shard_318.bin b/params_shard_318.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cd95134c839047c43f9f601b597b4a40bb01121d
--- /dev/null
+++ b/params_shard_318.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:faf85ee3b6af2e42b2f646cb5d570ae417b1e706580cd7bd2cd14383f7f731f5
+size 24150016
diff --git a/params_shard_319.bin b/params_shard_319.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1caf3e31fc896878609e5d2f8582ee13a1d125fa
--- /dev/null
+++ b/params_shard_319.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:297b3de458807bd946128dce2b370b0a68fb83ad36dd73d2dbec3be3198e907a
+size 41943040
diff --git a/params_shard_32.bin b/params_shard_32.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c6cb838d3dec910942ebcfc769e7c04f74a5c84f
--- /dev/null
+++ b/params_shard_32.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ce343c12fc18754a3d0d43ff753b35c30cee094388b038dd09612e7ba06f8298
+size 33554432
diff --git a/params_shard_320.bin b/params_shard_320.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6aad2d63c841f864fe0d884dfead494d54ba4c84
--- /dev/null
+++ b/params_shard_320.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3322b13119d808233d196ead7e543be30f0f4e3157b2a60562185be3046b9b0a
+size 33554432
diff --git a/params_shard_321.bin b/params_shard_321.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0c6d0a816e705cc5210c8199c1b11909053bdd3d
--- /dev/null
+++ b/params_shard_321.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4798504db2b9869a2b68b37601242d44f506f29e3026f765821345c55031cb71
+size 234881024
diff --git a/params_shard_322.bin b/params_shard_322.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9159f03c7ce475cffb6f540541672a3679b35e09
--- /dev/null
+++ b/params_shard_322.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:869e4c0ef465849c885a5bbaec85dc8d9f6208ddb6686b34ba8a5c349f5fa32e
+size 29360128
diff --git a/params_shard_323.bin b/params_shard_323.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c6cf2caba8651bca847f7fdf759967b01ffffca4
--- /dev/null
+++ b/params_shard_323.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a011dbfab8f3e1c343c855e150e99eba816bf8175f21a6177b4a54ce8350ee71
+size 117440512
diff --git a/params_shard_324.bin b/params_shard_324.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ecc6a60f3067b5590e8600cd427de2ebc61ea300
--- /dev/null
+++ b/params_shard_324.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:94b0a21fd9dff68601e4dcb8e520ac263ba28e5991d23a180897728655ba5af7
+size 24150016
diff --git a/params_shard_325.bin b/params_shard_325.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c2e740eaedf3c8b1a51d3c7376ae5c9e9d40d005
--- /dev/null
+++ b/params_shard_325.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0dd7991d30af691561e531527bef25212242dc39608315c626427bfe50661d68
+size 41943040
diff --git a/params_shard_326.bin b/params_shard_326.bin
new file mode 100644
index 0000000000000000000000000000000000000000..206376033ed4fd2bde66c1c2fd66cb80d79b0a1c
--- /dev/null
+++ b/params_shard_326.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:40a1ad5d9a1dbd430ca3d0c7cea2cc25c37060cdf2dd8ff4ce330cf41e9af8a8
+size 33554432
diff --git a/params_shard_327.bin b/params_shard_327.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d2c5cbd439595d4670493281cd3fc033f3547428
--- /dev/null
+++ b/params_shard_327.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6581b386c3b807e6559bad3a5b69dab9b73f57561f00e5ee470cb8b7c3bcc2b4
+size 234881024
diff --git a/params_shard_328.bin b/params_shard_328.bin
new file mode 100644
index 0000000000000000000000000000000000000000..29b752ddbb499eb7762166b5f6c74e61d4014f8b
--- /dev/null
+++ b/params_shard_328.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5b057f1a1265397c8d8d2798756b76f807da358625014cb8a8b5e21502cf3172
+size 29360128
diff --git a/params_shard_329.bin b/params_shard_329.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8267ab5e8e631865630aa78c16b8b32dc61475a5
--- /dev/null
+++ b/params_shard_329.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4abd8464cbfb040845c5689a271c483b4b79187dc45471b7efe26ac91e20940b
+size 117440512
diff --git a/params_shard_33.bin b/params_shard_33.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1c21c077cca6db51f012a3f1b8420ca2570ed6aa
--- /dev/null
+++ b/params_shard_33.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fa158645361420c09715d3c80ed5bf855ffe20953869d7f6f0765c7ff237f04f
+size 234881024
diff --git a/params_shard_330.bin b/params_shard_330.bin
new file mode 100644
index 0000000000000000000000000000000000000000..65dc55fe91ad76d9591d091f304ab53f99e362c7
--- /dev/null
+++ b/params_shard_330.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6752b5b3e5ba5999a246f3d1f049e0a3d2eee85ba4782cff3a88c45e8e84865f
+size 24150016
diff --git a/params_shard_331.bin b/params_shard_331.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2ca4e9bec80576ebe65733aff85ddfe005450bff
--- /dev/null
+++ b/params_shard_331.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:79ed2141c2bf5d4c52178791901e6fd3c14d96b60936264cd7d19b020096e52b
+size 41943040
diff --git a/params_shard_332.bin b/params_shard_332.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3a1962959978188c916d86af88035f3c2d4be6c6
--- /dev/null
+++ b/params_shard_332.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5364cc7638eef1e4a9d4e6b1f035593c8117a1a7af2bf869bc25a933db41b963
+size 33554432
diff --git a/params_shard_333.bin b/params_shard_333.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d09b9635efc347683cd44b0166fc24290b3d19d7
--- /dev/null
+++ b/params_shard_333.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:debea8f1fdfd388ec86d804eb34715c343c904df91995bb5a0e8fc815b7b628a
+size 234881024
diff --git a/params_shard_334.bin b/params_shard_334.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ac087af7742c2a160b6836abcef80b6ec075ca6e
--- /dev/null
+++ b/params_shard_334.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8332647d653f86e763fa94921989b0f230499f93f851a7d2d75e00a54d6a1b76
+size 29360128
diff --git a/params_shard_335.bin b/params_shard_335.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b7b7a2a4ee5fdb73db5da3f5443389428d6201f1
--- /dev/null
+++ b/params_shard_335.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6577e8cf3d87936247b09f3847cc237f0364f233dc5974b04e6460ed89265b0b
+size 117440512
diff --git a/params_shard_336.bin b/params_shard_336.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2b1bad3296664f7b631807ba746b0ae7449a2d9a
--- /dev/null
+++ b/params_shard_336.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:49bc0296ee29f56e25de654acbd2e7b7b5c950fc78deb588248f2cda6429f8fd
+size 24150016
diff --git a/params_shard_337.bin b/params_shard_337.bin
new file mode 100644
index 0000000000000000000000000000000000000000..92e269dcb7bdf48f3da1da002497dabb77cd805a
--- /dev/null
+++ b/params_shard_337.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:917a9325651ca1d1a157d48520bdb4abf3d14426e0405353c6316eeb8f1c44bc
+size 41943040
diff --git a/params_shard_338.bin b/params_shard_338.bin
new file mode 100644
index 0000000000000000000000000000000000000000..80054721250ff27ca70f395bf6a126d3ce9907fe
--- /dev/null
+++ b/params_shard_338.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:319810e727275fb86f4181b7c773cd97ccfa3e62eed0cf6e82ab215d08024242
+size 33554432
diff --git a/params_shard_339.bin b/params_shard_339.bin
new file mode 100644
index 0000000000000000000000000000000000000000..49c9c3da1d592ef0afe7b6e96ec95353a7f5f221
--- /dev/null
+++ b/params_shard_339.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0c441596e8836ebee87fcda5475bc8f2723f66f9197724d35afac16af7967cf7
+size 234881024
diff --git a/params_shard_34.bin b/params_shard_34.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9133d2401c914914c4e387addf1f40a7f0c80ba9
--- /dev/null
+++ b/params_shard_34.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:276b091e7bc775f02824b981df76295e97b5ac9d1d56aa2c3e9365fea1d05b6c
+size 29360128
diff --git a/params_shard_340.bin b/params_shard_340.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0449082dbe10bd10d35d6a924d16565bb233dd4e
--- /dev/null
+++ b/params_shard_340.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c09bc651200ad2e59f5cafed026dd4b5add767062547905ac447c2c5b2a678b8
+size 29360128
diff --git a/params_shard_341.bin b/params_shard_341.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c2db8077db1c06a9ee6dcccde55fa8558d229892
--- /dev/null
+++ b/params_shard_341.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f0a9eccbde6a3dfe0dc05de04bd27b7bb46127615c0f31243cc85278bd4ec8f5
+size 117440512
diff --git a/params_shard_342.bin b/params_shard_342.bin
new file mode 100644
index 0000000000000000000000000000000000000000..69f71ca93ae27d31713888c915cd044dadc7218e
--- /dev/null
+++ b/params_shard_342.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:08083ef765160bee0719d2c45bffe99bf753196598a3c6d0b0848700af31cfd6
+size 24150016
diff --git a/params_shard_343.bin b/params_shard_343.bin
new file mode 100644
index 0000000000000000000000000000000000000000..419835b4f0585f3401556eee16b7d142fb64ddf4
--- /dev/null
+++ b/params_shard_343.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d43c56920ae51423a542969a9d49f7dd7eda3c96f2f3262c123f7f89625530a
+size 41943040
diff --git a/params_shard_344.bin b/params_shard_344.bin
new file mode 100644
index 0000000000000000000000000000000000000000..441ae9257695ab891c9503a3462b2377f14e0280
--- /dev/null
+++ b/params_shard_344.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:85500aa28cbc93373bce12c84a76a3840ef8e678d3bc0eaae98804e6d9a7522e
+size 33554432
diff --git a/params_shard_345.bin b/params_shard_345.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7a51b7f2dc728fc6b9b6a1fb47d9c04d5de3f065
--- /dev/null
+++ b/params_shard_345.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:91097a9dbeafa34fab6351052725697980aa1620a045eaf46c7f8bd63d35c315
+size 234881024
diff --git a/params_shard_346.bin b/params_shard_346.bin
new file mode 100644
index 0000000000000000000000000000000000000000..79345750306d77441ffb410af1ca8f0143c9fa08
--- /dev/null
+++ b/params_shard_346.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:17a399a4376fa6205ed46a5891aa65f790b2c65027ad589059ab2faf61df9078
+size 29360128
diff --git a/params_shard_347.bin b/params_shard_347.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e13ecda9213985566365cf37e0309025f60822b0
--- /dev/null
+++ b/params_shard_347.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae75843d4b3b882c7afc7f38c4c33e472c860a8e7a53acf5a9e08212684e1964
+size 117440512
diff --git a/params_shard_348.bin b/params_shard_348.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cc20eacb63f8c2324dcaefea0635ec6000dd5d1a
--- /dev/null
+++ b/params_shard_348.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0f6f60cfd2d5c961776e081de26d76233ee5251092d7827b737d64d0cdfdf4ae
+size 24150016
diff --git a/params_shard_349.bin b/params_shard_349.bin
new file mode 100644
index 0000000000000000000000000000000000000000..01866d88fe6861d5c89b6cc8909efc6751c552d8
--- /dev/null
+++ b/params_shard_349.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2d45415e2cfb6766afa85d5e6bce2ac7abaff1dc002cd7655e1582bd6c43a226
+size 41943040
diff --git a/params_shard_35.bin b/params_shard_35.bin
new file mode 100644
index 0000000000000000000000000000000000000000..569918df012695a8d2d85dca5f3e25365f8214b4
--- /dev/null
+++ b/params_shard_35.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:50be1ab1f7b4c7a84a3123cba04c6e23726255705bd83a6db67b797b6211f540
+size 117440512
diff --git a/params_shard_350.bin b/params_shard_350.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3f3b8a6ea3e93b3d805b6f3be62b5cc162d0fa83
--- /dev/null
+++ b/params_shard_350.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c032c6919b11dbb049225e3f9351bad9a3bd67cf3e6c4b6ed5bf0f70c4fa05e6
+size 33554432
diff --git a/params_shard_351.bin b/params_shard_351.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a4acc296ff665b09aaf837ee959c08dadeb303ca
--- /dev/null
+++ b/params_shard_351.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb187de0c4d4ff7df424eec705f534284e8432fdc716e614f8df00cd073c9a23
+size 234881024
diff --git a/params_shard_352.bin b/params_shard_352.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c675614305351fe1578aa783805843f6f35925f9
--- /dev/null
+++ b/params_shard_352.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fd438407d5fbb87cbb2b22bf117431552167129e09906ef91d654b03742a9b20
+size 29360128
diff --git a/params_shard_353.bin b/params_shard_353.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8fb43bedf7a7756f595ec01acf4972ee5ec1af4c
--- /dev/null
+++ b/params_shard_353.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:454ad3c1b12a7f088f8e9cea450568f4f5aabe5a29529c7e6bda345a5d248991
+size 117440512
diff --git a/params_shard_354.bin b/params_shard_354.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5393c10ac39d6517ed305bb8cd1d3519567e16e8
--- /dev/null
+++ b/params_shard_354.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d10283cb01e57ab1f8fe8dc0179f841365cf76077020415f619a83e46d711099
+size 24150016
diff --git a/params_shard_355.bin b/params_shard_355.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bdcc913c8057298481e3c522165398cab7b480fa
--- /dev/null
+++ b/params_shard_355.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f474a9f9b3d7db255787fa77c5726fd9fcbf002a10c3c1c321e04f02cbcc09df
+size 41943040
diff --git a/params_shard_356.bin b/params_shard_356.bin
new file mode 100644
index 0000000000000000000000000000000000000000..19eac1c8bc7bce19c58c4e938927459c02179dc4
--- /dev/null
+++ b/params_shard_356.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4a034b78c323138d65c7615e0b9b3a9c8cedae18d3d604ddcb72ddc0a1518ed6
+size 33554432
diff --git a/params_shard_357.bin b/params_shard_357.bin
new file mode 100644
index 0000000000000000000000000000000000000000..63050cc715d70607146c1c86f1f367fb3e90ac89
--- /dev/null
+++ b/params_shard_357.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:841782dbd5aafce033b2795df10d0161d1b0591b50a371c733f30f04ec848994
+size 234881024
diff --git a/params_shard_358.bin b/params_shard_358.bin
new file mode 100644
index 0000000000000000000000000000000000000000..05d5e43a8355c9a06a4804b91d210074624d32c6
--- /dev/null
+++ b/params_shard_358.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:90e00a47ac6196202512a46dc33ae1c31025229545b79f7a63fd618b7ca8cac4
+size 29360128
diff --git a/params_shard_359.bin b/params_shard_359.bin
new file mode 100644
index 0000000000000000000000000000000000000000..18de37ee8ca3a7b551193b4b9a3ff6d5a055f66f
--- /dev/null
+++ b/params_shard_359.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:57f759ca6ad3630dedb6e6dc3c2e86bf74cc067ba4522ce42e4b36d2b5bc6eaf
+size 117440512
diff --git a/params_shard_36.bin b/params_shard_36.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5324f9103b4a9e81fb7234f0e1d1087f96591684
--- /dev/null
+++ b/params_shard_36.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d2abaeb78630b1788dff14f61bec96fd0b57ffbb0cf47ef0cf9e79a9c0756e8
+size 24150016
diff --git a/params_shard_360.bin b/params_shard_360.bin
new file mode 100644
index 0000000000000000000000000000000000000000..55eafa7fad316ebcbe963cb71e1b81bb8afad56d
--- /dev/null
+++ b/params_shard_360.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9fd15bbb5fbd32848e12b06d32f76c648f0821a400f5f240c9b7dc1c66f83f09
+size 24150016
diff --git a/params_shard_361.bin b/params_shard_361.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1065c327a2e94927694aa89f143cd88dc432704a
--- /dev/null
+++ b/params_shard_361.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8dd7651a23ff7842d331a0c19b32f3080e3c1467204ebd789edd728f3d9d331b
+size 41943040
diff --git a/params_shard_362.bin b/params_shard_362.bin
new file mode 100644
index 0000000000000000000000000000000000000000..96f73bf854ce26ca94061329e6c980162e5d5f2a
--- /dev/null
+++ b/params_shard_362.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:26f68426d1294bec29d1c8848932776eb598bb6f08dbc5b14761040a50f22b91
+size 33554432
diff --git a/params_shard_363.bin b/params_shard_363.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dc9a7361cd2598ab2f3537a7882a86f2c9ed2c6e
--- /dev/null
+++ b/params_shard_363.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eef7e0ee8e2976844832d88a417baabcca9ff92ad5654d395bef9f930cae5178
+size 234881024
diff --git a/params_shard_364.bin b/params_shard_364.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5b2e53dc34dcad25996bdce6ced85710a0271f47
--- /dev/null
+++ b/params_shard_364.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:575bd3d73828fe31d9bc0c4c597a34268edc0d5f1f7887120069309598ffd495
+size 29360128
diff --git a/params_shard_365.bin b/params_shard_365.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3a59097f4ccb476b4f91f11a110f9c388bab882e
--- /dev/null
+++ b/params_shard_365.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0e92df740fcbd8216f66b2bb01066f1cc17c5f3e2edf318069df2baa35a78749
+size 117440512
diff --git a/params_shard_366.bin b/params_shard_366.bin
new file mode 100644
index 0000000000000000000000000000000000000000..addede31ccef182bda51c37ddf318dcca05643d8
--- /dev/null
+++ b/params_shard_366.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:80a390a6d5da01761823bfc1b69f1c8e15cfe19824b2e3226de13b9114572173
+size 24150016
diff --git a/params_shard_367.bin b/params_shard_367.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5dd4e527f09e857136179d409870ac22c7918eed
--- /dev/null
+++ b/params_shard_367.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1411f40197bf5fdea3f89ede27ed8a05fe24b4095925f98ecb69680bcf88bb93
+size 41943040
diff --git a/params_shard_368.bin b/params_shard_368.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0a44a7e6e8e54f0c6914437f99f1f0e5e09b41ad
--- /dev/null
+++ b/params_shard_368.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:35ddbdd31adf9a6e81d2574131d5d9162e3514dabb260d88f75b88b0cb7c35f5
+size 33554432
diff --git a/params_shard_369.bin b/params_shard_369.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bebb4f0b9314cb47eb8cac04b65c4f2524eb2212
--- /dev/null
+++ b/params_shard_369.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d784376fb223b43423fa5b3a7729149c1a67db3308852294cd21cc5d85c1e0ee
+size 234881024
diff --git a/params_shard_37.bin b/params_shard_37.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3b02dceafdd9d90fe5cac4752e9ee6a05fdaa5fc
--- /dev/null
+++ b/params_shard_37.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:803bfda6aad12d62b038cb1e4930acf5a8c318de728bea8153ec9972d0449a22
+size 41943040
diff --git a/params_shard_370.bin b/params_shard_370.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2ba6b516c9762d47edd54a9e40f3c0f544085bfd
--- /dev/null
+++ b/params_shard_370.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4e2b6f15a4b5f5da9f4545c1dd558d8c83aa1c46288ca7951424c6ef07b9661
+size 29360128
diff --git a/params_shard_371.bin b/params_shard_371.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b4803ef03b07a971f309d8a0477e41f115f40cfb
--- /dev/null
+++ b/params_shard_371.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c0cb87028e685a60ea693d142cb95f60c55f13dddbf859750c42b3e7440010e3
+size 117440512
diff --git a/params_shard_372.bin b/params_shard_372.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7451d858d1804bc1cf8f5c55a229b76d27ccdaa4
--- /dev/null
+++ b/params_shard_372.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62aeabcdc387f55a511f055f6828a13c9d523d844839dd8e227934b5512fe639
+size 24150016
diff --git a/params_shard_373.bin b/params_shard_373.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ef753d54763996c2abe6bbd9d55614cfc31a1fce
--- /dev/null
+++ b/params_shard_373.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f0d0a457108ce94147d4634a0a2adc47027ccdd68c1aaac09b1d9fb87e8aedcb
+size 41943040
diff --git a/params_shard_374.bin b/params_shard_374.bin
new file mode 100644
index 0000000000000000000000000000000000000000..99117ef3a32810b9954ca4f76dcceaed86d29a9c
--- /dev/null
+++ b/params_shard_374.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:914135a24a2dcddfe71880c24f516d56ffdb89cfb5ea39d465cddb1c9fb5e602
+size 33554432
diff --git a/params_shard_375.bin b/params_shard_375.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a9bbf19faaf3515431b76931894f5db17fe78217
--- /dev/null
+++ b/params_shard_375.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6eab866c1e1bb27f784b2651f6fbcde8e134c00ec9c569f776681222961b0972
+size 234881024
diff --git a/params_shard_376.bin b/params_shard_376.bin
new file mode 100644
index 0000000000000000000000000000000000000000..db9e7ed5c8bd595a4d78831dcf00a824228b541d
--- /dev/null
+++ b/params_shard_376.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8045ba4e4f13b1f23099f3eec96c58b82aa98cb14dd6c49863aa3c3c29a353c2
+size 29360128
diff --git a/params_shard_377.bin b/params_shard_377.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5d1fbca2a57a7d0ea4326d345b801be6e470827c
--- /dev/null
+++ b/params_shard_377.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3fe4b43677fd354ede56868b0a0c4a7e7845e6e6e41c23d749b8b6916405cd63
+size 117440512
diff --git a/params_shard_378.bin b/params_shard_378.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a91c50544e0a3b93783532031d6e19b566992610
--- /dev/null
+++ b/params_shard_378.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6335f1776f6958893c964d4e60eac79e754809e924dbc0d4d754070554ec3200
+size 24150016
diff --git a/params_shard_379.bin b/params_shard_379.bin
new file mode 100644
index 0000000000000000000000000000000000000000..01f501f9e21df4c14c130452033325066126e897
--- /dev/null
+++ b/params_shard_379.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:507c040fc3912f3f765988e7920e7478efe66dc2a01762a9b612f2ce07fecd84
+size 41943040
diff --git a/params_shard_38.bin b/params_shard_38.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5ef72931f97b3a509b2a17437847ebce417f9cfe
--- /dev/null
+++ b/params_shard_38.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:378904da8428c7e74e24e3bcb65150c86a755a28145a14c67596caa3a6404638
+size 33554432
diff --git a/params_shard_380.bin b/params_shard_380.bin
new file mode 100644
index 0000000000000000000000000000000000000000..43c5da34363de19a5f354b952877e4223244b155
--- /dev/null
+++ b/params_shard_380.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8efc769107c8f4e263172984a1e892258b68c00c535eb46d0ef368232fe477df
+size 33554432
diff --git a/params_shard_381.bin b/params_shard_381.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0e95a49f92e51c279c46dfd34f97d00584530bf4
--- /dev/null
+++ b/params_shard_381.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bea2e8df7061aba0e54c37af3d86f2c54e9bdd224b9fa5e967a12625eaf7dc08
+size 234881024
diff --git a/params_shard_382.bin b/params_shard_382.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f9d439a08f0b328b6f371235e9611888022ffde8
--- /dev/null
+++ b/params_shard_382.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6c543bbe66fa3f59c15c80a2a340e19de4d0d2d57bcf4b34c079e3989e56b487
+size 29360128
diff --git a/params_shard_383.bin b/params_shard_383.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2c1fdcf0bfc59fc0b64c85d08a54fe8b07ceeb7a
--- /dev/null
+++ b/params_shard_383.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4e2777e44b69441e53f8090770f5f4283cb5b92fd66d3ca04ec7a5d2a41c410a
+size 117440512
diff --git a/params_shard_384.bin b/params_shard_384.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5fb8771f6902f6b1f9d49d9a5aeb5e28e1d1252f
--- /dev/null
+++ b/params_shard_384.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f85a9b5dae2610c2df1f11714e091c06bca46ff32056d5918ce6861f319773e5
+size 24150016
diff --git a/params_shard_385.bin b/params_shard_385.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6c695fb8b8c9754eb0e44d7e2173c2ff9faaffc4
--- /dev/null
+++ b/params_shard_385.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:034b06bc6ca375124e3ecdf5ee9be1792058946bec033692ea8690e04d20b0ae
+size 41943040
diff --git a/params_shard_386.bin b/params_shard_386.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa35bd35613afc0ba77ea95419f58fa5dec18042
--- /dev/null
+++ b/params_shard_386.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0714582d9f6c66ed9be17127fdb34b42acb065d6cfbd79a89dd200d181d23912
+size 33554432
diff --git a/params_shard_387.bin b/params_shard_387.bin
new file mode 100644
index 0000000000000000000000000000000000000000..30cd1b9fbcc51a93733a7e1d6d3a24b7365d8b23
--- /dev/null
+++ b/params_shard_387.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:049ad05c253ea73dbde4d2730ebb169bcc79002e4e9edd467af7e3fb881e0d42
+size 234881024
diff --git a/params_shard_388.bin b/params_shard_388.bin
new file mode 100644
index 0000000000000000000000000000000000000000..24ad178bd10fd912d8df282459da3c0d4d2a130e
--- /dev/null
+++ b/params_shard_388.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:517e99a233dd2e595e12dcbd21e5f607fa39c431d7d731a314ea11a9f25efd1f
+size 29360128
diff --git a/params_shard_389.bin b/params_shard_389.bin
new file mode 100644
index 0000000000000000000000000000000000000000..377c71f38f0e42341746335af593437335fc804f
--- /dev/null
+++ b/params_shard_389.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af11f002d57981b464f82a94db063d65dc1f9f9a03f2297096a35d89be348c63
+size 117440512
diff --git a/params_shard_39.bin b/params_shard_39.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d602a770054e98179775a19196a4478c6badb37f
--- /dev/null
+++ b/params_shard_39.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a5b69c1fd67b9405a213ac5b08cec187939cf8c5f57f6a0141e9a557cfdca02
+size 234881024
diff --git a/params_shard_390.bin b/params_shard_390.bin
new file mode 100644
index 0000000000000000000000000000000000000000..684264485d4b043f00a1f79ddfed53ee2360456b
--- /dev/null
+++ b/params_shard_390.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b8260b3879d3cf067e4a39ac7ffa91988e33eb69136083d77adea92907a21aa9
+size 24150016
diff --git a/params_shard_391.bin b/params_shard_391.bin
new file mode 100644
index 0000000000000000000000000000000000000000..76391555a620aaee4c89adfd9c9529b1ed8d2129
--- /dev/null
+++ b/params_shard_391.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b59b1957d38a59e6952d374675944c50e1bd9d46f4082e6eb1a02360342fc572
+size 41943040
diff --git a/params_shard_392.bin b/params_shard_392.bin
new file mode 100644
index 0000000000000000000000000000000000000000..15e5ae67693d15401e3f5f569d3b28c5ac98b184
--- /dev/null
+++ b/params_shard_392.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4e7e8ba96647cc53118cead41c2ad10f20f493142542b1c32d0aed14b5f926e7
+size 33554432
diff --git a/params_shard_393.bin b/params_shard_393.bin
new file mode 100644
index 0000000000000000000000000000000000000000..90955bfb102562884e9722f3581a82b0d4a2d847
--- /dev/null
+++ b/params_shard_393.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:928015aa2a4fe2ff65a312aeb774bc8273151014bb978027fc03233892fbe503
+size 234881024
diff --git a/params_shard_394.bin b/params_shard_394.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1a04fbec6fa61e8d37c6e1ca2f2b17dd1ec05c56
--- /dev/null
+++ b/params_shard_394.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6fc05db3a0aff4fe6531b4cbeb7fca548dc8a56737d34ec9a31f5b8f6c2f7b56
+size 29360128
diff --git a/params_shard_395.bin b/params_shard_395.bin
new file mode 100644
index 0000000000000000000000000000000000000000..54a062c79f908ae0d7664e352f4d633ece19e707
--- /dev/null
+++ b/params_shard_395.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6252aaf28260a8aa0e674673816baf5432960c3c866c4ae1b946df4155d88931
+size 117440512
diff --git a/params_shard_396.bin b/params_shard_396.bin
new file mode 100644
index 0000000000000000000000000000000000000000..29572740f030d7569b8bdc662d1efdb782bde543
--- /dev/null
+++ b/params_shard_396.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c03692c2defb1761ec87375d48c663ef2976765fbaca90f6bd61aaf480b6cf2f
+size 24150016
diff --git a/params_shard_397.bin b/params_shard_397.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ec97d2c355350cb936cbd922c753cba4c5a4be50
--- /dev/null
+++ b/params_shard_397.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da53c3b3f3c8e512750909d89cad108624329a492329540fb4acace761d82c53
+size 41943040
diff --git a/params_shard_398.bin b/params_shard_398.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e807d808713b2df4a0e457c5c7dd7fd171518cf2
--- /dev/null
+++ b/params_shard_398.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9a6cf613047368d187edb77defb9a09643240ced908b65c0bc13bfbb5f5e0001
+size 33554432
diff --git a/params_shard_399.bin b/params_shard_399.bin
new file mode 100644
index 0000000000000000000000000000000000000000..29bbbb987bee620b220eea703ddab9471ec5c461
--- /dev/null
+++ b/params_shard_399.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:347aa70767ad7430396984efe8391d164212f1827925f73b12b278e1b4ac2665
+size 234881024
diff --git a/params_shard_4.bin b/params_shard_4.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fed40590efcab72775cab6007e8f06b2597d993d
--- /dev/null
+++ b/params_shard_4.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:deffa73936d753509ef6421d13dcc3faa7006619556a79ef953ef7e32748df53
+size 234881024
diff --git a/params_shard_40.bin b/params_shard_40.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cb25a63ae1b24b97e934f7694d505373747cbfac
--- /dev/null
+++ b/params_shard_40.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ec7eece9cd9fd8c9f9a2c7add24d439c00a05864a7a17af51e296fcd044ae2df
+size 29360128
diff --git a/params_shard_400.bin b/params_shard_400.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a7935e834aebe9e8f3a594fee9ae4342e70397a1
--- /dev/null
+++ b/params_shard_400.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:743722be56071d12913e3aa73981146ab43874363e23c02b1d5aaf384eac9770
+size 29360128
diff --git a/params_shard_401.bin b/params_shard_401.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d81c86b03a836cdaf2069219baa76ef61e13b229
--- /dev/null
+++ b/params_shard_401.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e3a1b76145d2a4768bce5f1b309b3f27a923e49f70db578d892a9291d26c1fa3
+size 117440512
diff --git a/params_shard_402.bin b/params_shard_402.bin
new file mode 100644
index 0000000000000000000000000000000000000000..42bee846fe6cbfc8f3b79afd4e054283ea05175d
--- /dev/null
+++ b/params_shard_402.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:185c4ebb33076a6d5197c0fdc28443c78c6bf258ff151dad9192c421c02dc46b
+size 24150016
diff --git a/params_shard_403.bin b/params_shard_403.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d464275500662e1561b2c3530e63685dba657907
--- /dev/null
+++ b/params_shard_403.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:80169e97e67afca1ee2aa0a43dc6e8a00088f4686fbc259e853c6dd0fcd66b76
+size 41943040
diff --git a/params_shard_404.bin b/params_shard_404.bin
new file mode 100644
index 0000000000000000000000000000000000000000..347a285d312a404e44549eeb2548dfffd4e2b53e
--- /dev/null
+++ b/params_shard_404.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:58446ed900087c79d26e59e716d48fd10c87902da0d0395af16bbd7fd35693fe
+size 33554432
diff --git a/params_shard_405.bin b/params_shard_405.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f2499e06e4e707e02805225b03f312110ee3f796
--- /dev/null
+++ b/params_shard_405.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f8889085b21ab1f147be4fd7fba3e651f908a053697c4e54baac4a516948e6c9
+size 234881024
diff --git a/params_shard_406.bin b/params_shard_406.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ea91998802286700736b96402e5b565630a8b1c4
--- /dev/null
+++ b/params_shard_406.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6c0e6812b242129f5a6597b52a7b188dd93a2fcea2d1300e7f2edd6a9d1aa5ee
+size 29360128
diff --git a/params_shard_407.bin b/params_shard_407.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6c387b2d34c332ef0ea7a5b02a1a2392fb8d808e
--- /dev/null
+++ b/params_shard_407.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dcbb22748e0f4c2135c3cc422e26a55f0515d15f6e408c45a4d8e18b4a272325
+size 117440512
diff --git a/params_shard_408.bin b/params_shard_408.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a1448bc94274cba4cebc2db9c67832a2e4583a01
--- /dev/null
+++ b/params_shard_408.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:57643df047e90d4b963ef812e1b3699fbab2c4a4bd8010c782aab07d26e1d009
+size 24150016
diff --git a/params_shard_409.bin b/params_shard_409.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7357586698181376436a09841061d1cff374830e
--- /dev/null
+++ b/params_shard_409.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0890b03d2abc70d7fdd2c7d6220340e60c45d218fb8b659bdeab5fa96f409403
+size 41943040
diff --git a/params_shard_41.bin b/params_shard_41.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a9a8626ec902f90fd6ef4d2e82f0cd2276497cd5
--- /dev/null
+++ b/params_shard_41.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:49ffb99e377e7606a81e50a30c1ae0e12bbcd77c7d9f226f9a70b27c28617a48
+size 117440512
diff --git a/params_shard_410.bin b/params_shard_410.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cae19d76e9fa2fbf8425450cd36b3acd7459bbf0
--- /dev/null
+++ b/params_shard_410.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0ef2e91d67dd940514ba288778883175d3ad8efb8b8311e98a5fc1f631699f7b
+size 33554432
diff --git a/params_shard_411.bin b/params_shard_411.bin
new file mode 100644
index 0000000000000000000000000000000000000000..af00a480a81fbd10d4374eb67bd58bde516b7b7f
--- /dev/null
+++ b/params_shard_411.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6ff3ed26cb92aa383d6defb7d7c86e99fcba4368c405c9f81e8f7ca1db9bfb8d
+size 234881024
diff --git a/params_shard_412.bin b/params_shard_412.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5e8851759af5d2cbf76f77dc36e68f4b733e42ae
--- /dev/null
+++ b/params_shard_412.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4e75ff09ce1dadbc0bf8cffe91c4632a9d025c7fc90247eae0089392b9513854
+size 29360128
diff --git a/params_shard_413.bin b/params_shard_413.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2f2f7d9c91f9ab74f7fe8a578adf80b908f7a9f6
--- /dev/null
+++ b/params_shard_413.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:96e6f8878af55e711c57203097206fe917b4a6f7f456f089c5baa1c84b950a45
+size 117440512
diff --git a/params_shard_414.bin b/params_shard_414.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3332afa91b9b3dc9baa76f962d3d02eafcd80d90
--- /dev/null
+++ b/params_shard_414.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d9ada0a0f8f9be880ef4b948f73c16ce2ffc776015a6584746115406f68e9d70
+size 24150016
diff --git a/params_shard_415.bin b/params_shard_415.bin
new file mode 100644
index 0000000000000000000000000000000000000000..abc43183862240de6526eba1375b34b7766a551d
--- /dev/null
+++ b/params_shard_415.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:09cad8111ef5b18fcf0d7c5ec9583e7d5ecf60792df179d08dadc480226940a0
+size 41943040
diff --git a/params_shard_416.bin b/params_shard_416.bin
new file mode 100644
index 0000000000000000000000000000000000000000..272eaede1cf99e0e9e449d577d726d5454907755
--- /dev/null
+++ b/params_shard_416.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b61752bf056b393ab56a9e5ad11a402a60981863bc7f134ec5792faa45752a78
+size 33554432
diff --git a/params_shard_417.bin b/params_shard_417.bin
new file mode 100644
index 0000000000000000000000000000000000000000..526046d7c0d826ab100677f0ce8fbd48d547a211
--- /dev/null
+++ b/params_shard_417.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:16def654a03add7fdc711214ab9b3768c587e789322843793f2973af98350c73
+size 234881024
diff --git a/params_shard_418.bin b/params_shard_418.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c896714f9a9cda4b2b0e7c7cc3a3e7a738e13f96
--- /dev/null
+++ b/params_shard_418.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:931cf6e7903e3bc43e8e17ae1f4788243b031283ab7bc77f1264f82749be95c4
+size 29360128
diff --git a/params_shard_419.bin b/params_shard_419.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b02be4d21c03314050276b06d5f1aeda7025fab
--- /dev/null
+++ b/params_shard_419.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1f115f10f81850d7efc26f80b460ce982be9c49988fb02775a9268589cfbeac5
+size 117440512
diff --git a/params_shard_42.bin b/params_shard_42.bin
new file mode 100644
index 0000000000000000000000000000000000000000..22c25724dc6afff43b974c0d4168dab56e00716a
--- /dev/null
+++ b/params_shard_42.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e19b4038f57d7265e4de14c9748027b7d1398f46178651751aae9f26be25e129
+size 24150016
diff --git a/params_shard_420.bin b/params_shard_420.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0e0490a1b7c29763740e3d9ca48dc9d1eec19bb4
--- /dev/null
+++ b/params_shard_420.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab7e6505ee9c6077ede35a065079389c888acdbc125bf2d81b1c92ea9b2f7c64
+size 24150016
diff --git a/params_shard_421.bin b/params_shard_421.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5428ec6b3178983181fb2bd38279476224946ffa
--- /dev/null
+++ b/params_shard_421.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8b6af071cc7f32a6517d1526edb359ea4db75f38ba5e20fc1baaf43ad2b357e2
+size 41943040
diff --git a/params_shard_422.bin b/params_shard_422.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d2b8e7af9a6488d74fcbd9ae6d843bbe965ff27a
--- /dev/null
+++ b/params_shard_422.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:02daa57a998da1cd9d3a9f6d95a066d8bdf9b3274c88cbd3c49b38be16f7e9b9
+size 33554432
diff --git a/params_shard_423.bin b/params_shard_423.bin
new file mode 100644
index 0000000000000000000000000000000000000000..00d022f233fd6796823d29c3de220fa5a1a18e71
--- /dev/null
+++ b/params_shard_423.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf186658a8ddd6b02416127db5ecd476cda3fde0d93dd5832c44b577dc35bc65
+size 234881024
diff --git a/params_shard_424.bin b/params_shard_424.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a6d1045a9976b4d4a4996edb40946e18e84a1f6e
--- /dev/null
+++ b/params_shard_424.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:194565a1cc59388ecaf1aab58ae4415cdf31e5986d522631afe3cf2f4d902d8a
+size 29360128
diff --git a/params_shard_425.bin b/params_shard_425.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f039afce60f9a05301a79ed90a7ad7258bcc6133
--- /dev/null
+++ b/params_shard_425.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:07a85a41ccb2768a242991da6e8399d83abd5b44c111e835eef892c84930ad61
+size 117440512
diff --git a/params_shard_426.bin b/params_shard_426.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e714043f976072f54e95b98da73f62e754990130
--- /dev/null
+++ b/params_shard_426.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9686ad75bc29a4e52b1fd2dd3ed43075495e1e93c4180b8b00886e227ee38099
+size 24150016
diff --git a/params_shard_427.bin b/params_shard_427.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9f3bca45aacd1eaaa5907bbf984f4f82bdea3c84
--- /dev/null
+++ b/params_shard_427.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bb6f05535d3ee54ccd1bb1a59e72128b4b50fef1bdf7423c5afb87d20fab132d
+size 41943040
diff --git a/params_shard_428.bin b/params_shard_428.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7ba8bbff7583b86a1fb0e0ed67613121c01564c8
--- /dev/null
+++ b/params_shard_428.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fa2d062f8abf004ca201d348069af85f28ec486950ae9c32d704afead656bc9a
+size 33554432
diff --git a/params_shard_429.bin b/params_shard_429.bin
new file mode 100644
index 0000000000000000000000000000000000000000..796d7110e94f8e7cd235d4d0454767b782b59d38
--- /dev/null
+++ b/params_shard_429.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:42821ae3953492b42c0363501a434ecbae2cddea66437c28d28bb26723100948
+size 234881024
diff --git a/params_shard_43.bin b/params_shard_43.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0206ddc467503e994c4a60f6d0b62dbd7b30ca99
--- /dev/null
+++ b/params_shard_43.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5d49046f664c4bd1b9e86e4407ccfc3fd21305f4f47c7854cd99454ed16f6723
+size 41943040
diff --git a/params_shard_430.bin b/params_shard_430.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cbac77287f81d7e0754d4fbfb179bac1400fee58
--- /dev/null
+++ b/params_shard_430.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:228f67d7a5d5037c2fcc0fece091f4f4fd3d3ccd692928bf6df6bca7320eedca
+size 29360128
diff --git a/params_shard_431.bin b/params_shard_431.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3bc008f624baea7f94241f4fbf79b4a3f25331a9
--- /dev/null
+++ b/params_shard_431.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:71387583d308ea0485485812c5193927c188b16b8af7f480152d737ea590c353
+size 117440512
diff --git a/params_shard_432.bin b/params_shard_432.bin
new file mode 100644
index 0000000000000000000000000000000000000000..93733b22f8dfe0427e202a745a4cc2c56e0a81d8
--- /dev/null
+++ b/params_shard_432.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5cd1c6b8233c123415341178ce95394821172b52cc94f1809673c2f992f19c99
+size 24150016
diff --git a/params_shard_433.bin b/params_shard_433.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4cc090202a291c1b69662e75893ba62a669afe53
--- /dev/null
+++ b/params_shard_433.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1377168a25ae97a8451c94b557a6a7b15f459a206df0c9dbbdb23d78d7e5bed2
+size 41943040
diff --git a/params_shard_434.bin b/params_shard_434.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1956d0c47bb51a0ff628ef78fdc66ec5ead3002e
--- /dev/null
+++ b/params_shard_434.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:49773e846c127ac99d5c7b69eae30be9818660d7c1be65728e0187b1dac75a19
+size 33554432
diff --git a/params_shard_435.bin b/params_shard_435.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d3796f64e70a6496f72227a0dadf7f443c73398e
--- /dev/null
+++ b/params_shard_435.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:98a5d95715202e1c8456c81e0b2a01dc27addd11e01de2ee9c7337314c91313e
+size 234881024
diff --git a/params_shard_436.bin b/params_shard_436.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e50e8f7c86a4b9fdd71ec80ef52263e5b3c9297e
--- /dev/null
+++ b/params_shard_436.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2fb6681d97e13c320e455c5adda29751298a84c2ca82a48bf0bb4a94839b62de
+size 29360128
diff --git a/params_shard_437.bin b/params_shard_437.bin
new file mode 100644
index 0000000000000000000000000000000000000000..99f2d9cc616a7dde04ab6ed4053c8b890300e507
--- /dev/null
+++ b/params_shard_437.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:31a00e92cd6f4b1e2e59d056507e992d3aa8cc9d4174395b43f76e49301d0340
+size 117440512
diff --git a/params_shard_438.bin b/params_shard_438.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f29894278184e7cf589d66919f18185a0e05c69f
--- /dev/null
+++ b/params_shard_438.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:00eb4b6eafaec3ee8e3c1a63b98b747cca9d0dcbecbf4b8b30d4250eba53a8be
+size 24150016
diff --git a/params_shard_439.bin b/params_shard_439.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0c8f922bf6d9d03e4f282f3274c6c510886e16e1
--- /dev/null
+++ b/params_shard_439.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c7068eb5f1470fb2c6c501bf8a9df06389dea5d46753c1c0bb3f73d9b110a7a5
+size 41943040
diff --git a/params_shard_44.bin b/params_shard_44.bin
new file mode 100644
index 0000000000000000000000000000000000000000..62e2d0f5765e9d922cc66f2a7a6086c82f481dc9
--- /dev/null
+++ b/params_shard_44.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fb6fc1f3b055928663e8981fa5b87c66062f01e8920a0ccdd94da4f7eef5e820
+size 33554432
diff --git a/params_shard_440.bin b/params_shard_440.bin
new file mode 100644
index 0000000000000000000000000000000000000000..19a6090da6214b9f30988aeac67a351a403b3e51
--- /dev/null
+++ b/params_shard_440.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d97607765894bdcd78924361790303630e814d341b068f9b1c09b15b595ff26
+size 33554432
diff --git a/params_shard_441.bin b/params_shard_441.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6139dd43af241516484c74e3195123110d508aac
--- /dev/null
+++ b/params_shard_441.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:12806ba2d06d150621dce2324f3b354ef6451ca575f64fe079c019bece67913e
+size 234881024
diff --git a/params_shard_442.bin b/params_shard_442.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e9e9bbf845041997aa3e93b9b90a3fb74a5bb725
--- /dev/null
+++ b/params_shard_442.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c214ae0c90c1cf821c5e05f01e07b3dc59aaaf27120f3f70fe07af100ce538d6
+size 29360128
diff --git a/params_shard_443.bin b/params_shard_443.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bde150628da9cc54b979f280cf54f89e44c34a7c
--- /dev/null
+++ b/params_shard_443.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:77246728f6b06028d61b1d92f8776710f8a5fda84fd986770bf27639751c6cce
+size 117440512
diff --git a/params_shard_444.bin b/params_shard_444.bin
new file mode 100644
index 0000000000000000000000000000000000000000..06de4690a5662f6631cf2d9f7a6167d9a718e513
--- /dev/null
+++ b/params_shard_444.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:29b4853e4b6aceb8492e55c0db3378fee5d053462032fe0edf3965bd925b1ef8
+size 24150016
diff --git a/params_shard_445.bin b/params_shard_445.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7bbf0d52ae0ede0bb16ea9322a6e25f0c1624b93
--- /dev/null
+++ b/params_shard_445.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:601f14cf8c3b8f95790de812fd25d22b0742774def401dc7a9821fe5dc353ca5
+size 41943040
diff --git a/params_shard_446.bin b/params_shard_446.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7a6d31027d1f4b728b36fd54e7fd8b19613a7a3d
--- /dev/null
+++ b/params_shard_446.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:98632f04c76735e382a955f3b0706f6cad0407f5faf54352cfb187a5b9858910
+size 33554432
diff --git a/params_shard_447.bin b/params_shard_447.bin
new file mode 100644
index 0000000000000000000000000000000000000000..58c8daa2c15f646e2172b2cc6f7697b70a5a8ae5
--- /dev/null
+++ b/params_shard_447.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2cf595445e002c76a13e0da01625d355325cbdb562e4f02eeeabbd4e2eb32e06
+size 234881024
diff --git a/params_shard_448.bin b/params_shard_448.bin
new file mode 100644
index 0000000000000000000000000000000000000000..511f67394ca9ad612c7af154d1cff8dcbe0eb184
--- /dev/null
+++ b/params_shard_448.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:77ed2984a6dcf6cfdfd0122b2ce21e514a6c3067b4ce3001421ae9a3a7074a92
+size 29360128
diff --git a/params_shard_449.bin b/params_shard_449.bin
new file mode 100644
index 0000000000000000000000000000000000000000..304ceb2b4353dff972b55505df508f3ce6542d81
--- /dev/null
+++ b/params_shard_449.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:48c6951694458fd4215eaa7266b07a85ec452a02484ed6a5b570ec8faa6b7bbc
+size 117440512
diff --git a/params_shard_45.bin b/params_shard_45.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d3c027fa480ab24596cc48e3eb9f6f7ba10078e3
--- /dev/null
+++ b/params_shard_45.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:77ad2a8276473b5bdbd052158428fc99b1b59b1f1c4d816328c1e9f84f83b683
+size 234881024
diff --git a/params_shard_450.bin b/params_shard_450.bin
new file mode 100644
index 0000000000000000000000000000000000000000..26826e46b11c949619d1e97338d202cee845602a
--- /dev/null
+++ b/params_shard_450.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1641c510dda4fa01af0a1cc04384b8ed981aa374f372520b65d23c21636ef328
+size 24150016
diff --git a/params_shard_451.bin b/params_shard_451.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0c1b77ee49f949ce309da3c3f54e70c3a48fec98
--- /dev/null
+++ b/params_shard_451.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:057dea90376b0805b8e553a9a1e82a704fe307820c10bb57c72c1d01cf063f4a
+size 41943040
diff --git a/params_shard_452.bin b/params_shard_452.bin
new file mode 100644
index 0000000000000000000000000000000000000000..43cbbf2019b77f36e101dc27a5e3274009a2baab
--- /dev/null
+++ b/params_shard_452.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6353b9855fb7a4df2e9d70d37cbd11ae00e8e20881d99c653396bfe16ed7310c
+size 33554432
diff --git a/params_shard_453.bin b/params_shard_453.bin
new file mode 100644
index 0000000000000000000000000000000000000000..076b7f858deb414a2a483f67bf8f8d9fa0a5a756
--- /dev/null
+++ b/params_shard_453.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6395fe2c6359fd3510378a223bc4f3d488c8bbe9df32aefd8912bd9972b39da6
+size 234881024
diff --git a/params_shard_454.bin b/params_shard_454.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3081a674368f97ceaf230719ecc3c44a0faa9c1d
--- /dev/null
+++ b/params_shard_454.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5729e5eacb1be5c9c837e73436a2575e4fb4bf1e2534bebddf1643aeaaaac134
+size 29360128
diff --git a/params_shard_455.bin b/params_shard_455.bin
new file mode 100644
index 0000000000000000000000000000000000000000..888ce5fd9ae3ff9ab1fe24837702235b25907c79
--- /dev/null
+++ b/params_shard_455.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4728afd2a2dbed41039e5c2f03c10abecf86545972a9b686af2c974706c0b2e1
+size 117440512
diff --git a/params_shard_456.bin b/params_shard_456.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9842a469773cfb17da8808ba6f3298e8bcb74549
--- /dev/null
+++ b/params_shard_456.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fb3589ca228de5d4b7b99b02d5a7a2f9713620a81a09e08c7682f70f4a65d913
+size 24150016
diff --git a/params_shard_457.bin b/params_shard_457.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d72ea82b07b5e4738ede2f07e87b4d553435bace
--- /dev/null
+++ b/params_shard_457.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:909dd914ed72e14f0215a3b4d960c9af455c90d72e4db60e9c94b0dce3698158
+size 41943040
diff --git a/params_shard_458.bin b/params_shard_458.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3a7fdc296d2cef8c922c9b490babffecdd2a7b11
--- /dev/null
+++ b/params_shard_458.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7775fe240a153ce1ef1fa9ee8db482e33bd300c48f18262a7cc9fcae9057a6e1
+size 33554432
diff --git a/params_shard_459.bin b/params_shard_459.bin
new file mode 100644
index 0000000000000000000000000000000000000000..db6c9472ba97fc566cb2a4cf94c6f9d4ced9caf3
--- /dev/null
+++ b/params_shard_459.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:76a0f627bd1fbe631d5f0143692cc0bd0e54120dfda699a822fe6ee1af0ee89f
+size 234881024
diff --git a/params_shard_46.bin b/params_shard_46.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c6c3d7178e1b0c9ab0431b9c6e3f7d87c0715937
--- /dev/null
+++ b/params_shard_46.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5a08374aa0ee7958a33e90beb3468b3ae487a66326d674e092573733fe3f97d3
+size 29360128
diff --git a/params_shard_460.bin b/params_shard_460.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d354c73aa6fbce2756fcf518a0a271afe61f8fd
--- /dev/null
+++ b/params_shard_460.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:23bfda2017ca9b4f7f711eb7c4a1572f59fcb4dfb8e3d38ea5ba6906c7dfbdd4
+size 29360128
diff --git a/params_shard_461.bin b/params_shard_461.bin
new file mode 100644
index 0000000000000000000000000000000000000000..455ceda60bf22e8ed44e7a138de48efc10b9ad86
--- /dev/null
+++ b/params_shard_461.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d382b880a319f101dc260464c0f5f54594e0a0fbc9a12e26b32cf2fcdb277925
+size 117440512
diff --git a/params_shard_462.bin b/params_shard_462.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4bcdc9e29fdf8c74ab0068f01dd9eae893e78d15
--- /dev/null
+++ b/params_shard_462.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c8cab7f042fc4000f099d6953a051ec538b05c77a4f471b3c961071ae7add234
+size 24150016
diff --git a/params_shard_463.bin b/params_shard_463.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3ff6fe06ba9673755a91e76b43952fbdad83a44f
--- /dev/null
+++ b/params_shard_463.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:93508e27335522bffac75726e3fe6b18f067c327487e9ac985a3d26f77598827
+size 41943040
diff --git a/params_shard_464.bin b/params_shard_464.bin
new file mode 100644
index 0000000000000000000000000000000000000000..66f45a124832836775afeff5041f31771248249f
--- /dev/null
+++ b/params_shard_464.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2f8996be155b27e4306457d6437e1d975dcda770bd314768696194930c6ffe5a
+size 33554432
diff --git a/params_shard_465.bin b/params_shard_465.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9c4f66098bd5a0f0cbb7cffc36b4636b880b9687
--- /dev/null
+++ b/params_shard_465.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:81d850a7228aca8cdb33b42616a9949acd32c99400c92b0382a3823f08ecfa7d
+size 234881024
diff --git a/params_shard_466.bin b/params_shard_466.bin
new file mode 100644
index 0000000000000000000000000000000000000000..88c325f53caa39b0ea4d6ea6733ae2cbe1f8718f
--- /dev/null
+++ b/params_shard_466.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4ef47ee7da88c40d16fa9dbd1e299ff75f28c7200c95c59075731f2eb0872b28
+size 29360128
diff --git a/params_shard_467.bin b/params_shard_467.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a838fa8f99b460482661eeb3c0f40db04830865c
--- /dev/null
+++ b/params_shard_467.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0f2dc5c47a6640c148a9283587b66dccfc04a964744a819b1601459305455473
+size 117440512
diff --git a/params_shard_468.bin b/params_shard_468.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1db4894f9d782e831f33bb4ba7c1078f37ae1a24
--- /dev/null
+++ b/params_shard_468.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a6b3ecc1dd31b9c4ce15185b4f744cc5529d8a84543bc246aa8b66ec17e22aea
+size 24150016
diff --git a/params_shard_469.bin b/params_shard_469.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5d7549038bcfe5c38f660fea6e800b4b222a031e
--- /dev/null
+++ b/params_shard_469.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:becd9c0945840b5bd20c925c39e37fff2cc696a64e35f5ad4e784b0392dedec5
+size 41943040
diff --git a/params_shard_47.bin b/params_shard_47.bin
new file mode 100644
index 0000000000000000000000000000000000000000..17b3ea0deb6953e2fa8a24fdd2814e7a438329e3
--- /dev/null
+++ b/params_shard_47.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cd7d28ff243ee3012f58d49ed587ef6a17778a3ec76be6943a639f09aa2d711e
+size 117440512
diff --git a/params_shard_470.bin b/params_shard_470.bin
new file mode 100644
index 0000000000000000000000000000000000000000..06e52adf62e686651c2e125e6642b32c78b23b97
--- /dev/null
+++ b/params_shard_470.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:021097aa443467cb46de0282b7d9af51317092b1028bf1a8dabe0f0f6dfc7550
+size 33554432
diff --git a/params_shard_471.bin b/params_shard_471.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2a184363f8c94ad31aaddd8a474024fd9fbff1e8
--- /dev/null
+++ b/params_shard_471.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9369dfff70fe3a3b11421cb35b09d1df0b6b7760588f473f2c951d6c94f57783
+size 234881024
diff --git a/params_shard_472.bin b/params_shard_472.bin
new file mode 100644
index 0000000000000000000000000000000000000000..00920c43b623cd8047ba49e917a43623e10c5ea4
--- /dev/null
+++ b/params_shard_472.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:937eee3dd99c11ce935ec6676c843e4dd4b17d320d77accaa156a2d04228dfa2
+size 29360128
diff --git a/params_shard_473.bin b/params_shard_473.bin
new file mode 100644
index 0000000000000000000000000000000000000000..26c90694b57702d2cf0bf7846832711d2fef345a
--- /dev/null
+++ b/params_shard_473.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9bfe45d9305a6be8b24dce6dd1154158c0283b16083994578a7405f94f1a1a52
+size 117440512
diff --git a/params_shard_474.bin b/params_shard_474.bin
new file mode 100644
index 0000000000000000000000000000000000000000..549d45709992293ca3244a4174b7c1fbfbea8209
--- /dev/null
+++ b/params_shard_474.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:30421c3062d82c4801309057950da74762c1b403af0c6ffec3de680baea9b960
+size 24150016
diff --git a/params_shard_475.bin b/params_shard_475.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f46764ebc95dbb4342d4e20183f040a83e7accab
--- /dev/null
+++ b/params_shard_475.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bab7938283980f6b8946e530385a87b764add81548b9fd588ff0dc8fe9c7a36f
+size 41943040
diff --git a/params_shard_476.bin b/params_shard_476.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b66d13d83bb01d7b6f7428397833e00b9811dc4b
--- /dev/null
+++ b/params_shard_476.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dda36b412621f7f3cc174442ccace674e2ad21d113391fe2c7402001587249fa
+size 33554432
diff --git a/params_shard_477.bin b/params_shard_477.bin
new file mode 100644
index 0000000000000000000000000000000000000000..280aafad9d0c19c0f69998228f40cb1a1fc4caf0
--- /dev/null
+++ b/params_shard_477.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c80d090ea7b43b154bdb9f09205504eff27cbcc42e65c66e1b9ff2e476fd6d67
+size 234881024
diff --git a/params_shard_478.bin b/params_shard_478.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2cdb2ee33b982133968e10b09f6d931d44bdc2bc
--- /dev/null
+++ b/params_shard_478.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ef244b33da4cf530bb53619a13716dade53ac39342afc43e37e75b33ac57b8ae
+size 29360128
diff --git a/params_shard_479.bin b/params_shard_479.bin
new file mode 100644
index 0000000000000000000000000000000000000000..279dba43068693edba3259bfb543dec0460ad038
--- /dev/null
+++ b/params_shard_479.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:017bd1d13ee3b5dd21ba72319422bf181eb47eec60d9790ad267c4516c4beb2f
+size 117440512
diff --git a/params_shard_48.bin b/params_shard_48.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2ebbcda8100926e2f84664fa14a54f98bf8e7ffd
--- /dev/null
+++ b/params_shard_48.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6907b93dbed5bedad7ba08ce2d4c4ece7fe053a4c827853a008386322f659a72
+size 24150016
diff --git a/params_shard_480.bin b/params_shard_480.bin
new file mode 100644
index 0000000000000000000000000000000000000000..394fd1fe6423d75e7326c1cba6cd59b2d2f75450
--- /dev/null
+++ b/params_shard_480.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8e1cc0b55e06bf00aad79bfc2a44dad51226ed0c3b40608c08e3ab8339ef9628
+size 24150016
diff --git a/params_shard_481.bin b/params_shard_481.bin
new file mode 100644
index 0000000000000000000000000000000000000000..205129e3245659cfcc935531217601b39f36a52a
--- /dev/null
+++ b/params_shard_481.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a903481219c440a0f36d84276a1b1534a76addf6a99bce7875d87b82f4bcf3b7
+size 525336576
diff --git a/params_shard_482.bin b/params_shard_482.bin
new file mode 100644
index 0000000000000000000000000000000000000000..31148aa8da02517111030fefa806c0d27a790115
--- /dev/null
+++ b/params_shard_482.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:07cf5b3bd1303428dfdd441bd846d16c950d3758f1307c31232c968e83c29a3f
+size 65667072
diff --git a/params_shard_483.bin b/params_shard_483.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9161f85c942adee621836e8ccac0551fd1646a87
--- /dev/null
+++ b/params_shard_483.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4ccc2423cd3974ef6915819d6672e4bb6e5b8e085c88d218adbede40d4123816
+size 14729216
diff --git a/params_shard_49.bin b/params_shard_49.bin
new file mode 100644
index 0000000000000000000000000000000000000000..083ccac9c36af7e8a539b3edd5b5cf06b3e5aa92
--- /dev/null
+++ b/params_shard_49.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c3f0f6ef334d93204c77430fdebb98bd6f0c26c5ca45a042c8ed8fea890fa13
+size 41943040
diff --git a/params_shard_5.bin b/params_shard_5.bin
new file mode 100644
index 0000000000000000000000000000000000000000..57bc07dc4bdd9b6944c737644f73304963c76d22
--- /dev/null
+++ b/params_shard_5.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:67d3e14e021a5b2276e0c633eee91a4b9e9b140f66211fa5d24876eb8b9b5583
+size 29360128
diff --git a/params_shard_50.bin b/params_shard_50.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ceb13d03236655976403d4000a087b5fbe4fe5a6
--- /dev/null
+++ b/params_shard_50.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d748e8a52a76546d4988e94de4838fe0f146c3ec2737e4e49e511fef18ce65d
+size 33554432
diff --git a/params_shard_51.bin b/params_shard_51.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8f198680af104d7970311be38f243fb90c686bde
--- /dev/null
+++ b/params_shard_51.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aadeac5857e6ac5d57a53de417937945b2d4e684212227e5adcc8983f670e43d
+size 234881024
diff --git a/params_shard_52.bin b/params_shard_52.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8b749bceba4a351ac02d296e62fd02bcb225da4a
--- /dev/null
+++ b/params_shard_52.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a69105720fd3658a25d833243671a2f3aa180660958069960a0a4c07f243ba4a
+size 29360128
diff --git a/params_shard_53.bin b/params_shard_53.bin
new file mode 100644
index 0000000000000000000000000000000000000000..00daedbb244ef3a71e1f817eb49f3efad08636d3
--- /dev/null
+++ b/params_shard_53.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2c82cdfc1ba4e4677eaa735c26a3f844032a11bd4bd112e9a40e1f043506eb5f
+size 117440512
diff --git a/params_shard_54.bin b/params_shard_54.bin
new file mode 100644
index 0000000000000000000000000000000000000000..56a54f88bd9d34751d060059a2c8cfb7562ae4f0
--- /dev/null
+++ b/params_shard_54.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0d186b5b3c945038b06069f605ecf97b1390edebc4527d5aecb6c99058d6cb56
+size 24150016
diff --git a/params_shard_55.bin b/params_shard_55.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d4dc530051ae12af21cb2a2016e1e2e3ac6e421d
--- /dev/null
+++ b/params_shard_55.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:889f6036ecf00d9c4bdbef7ca8d9336b842c26b8daa30b7752ee1368bf8ce5b4
+size 41943040
diff --git a/params_shard_56.bin b/params_shard_56.bin
new file mode 100644
index 0000000000000000000000000000000000000000..053ca31f3c4e22246a599f2cb1ccef363cf25ac7
--- /dev/null
+++ b/params_shard_56.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:61f4a51940473525b550ae969cea83c4b9901d65da060a79db1e8119fd414331
+size 33554432
diff --git a/params_shard_57.bin b/params_shard_57.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1577dd0605f059f67b707ca44dff82201ef674ea
--- /dev/null
+++ b/params_shard_57.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1153a58a106ab3f9f25e1feadba6d47b8b58d20426fe7333198f2e54f7760b33
+size 234881024
diff --git a/params_shard_58.bin b/params_shard_58.bin
new file mode 100644
index 0000000000000000000000000000000000000000..869c3a5a8dfa2a9512490d87da9e46931c939023
--- /dev/null
+++ b/params_shard_58.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e1d2b0ab48aad0f65ca42a0107ea1a6fa29f206f90cb7967f00497e67d06e6ef
+size 29360128
diff --git a/params_shard_59.bin b/params_shard_59.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9b1304c75cfcc1494fcdc2adcf08d02eb8abe555
--- /dev/null
+++ b/params_shard_59.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3b25517842f5828ecd4636a51f937feeb368045c6a6705a245c2423d2b40a842
+size 117440512
diff --git a/params_shard_6.bin b/params_shard_6.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d375507f92aa795a74f38f73287f6a211fb62759
--- /dev/null
+++ b/params_shard_6.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d322611af2ca2c9acaef6f3d2c02b7efb30ea3df645456d3acef092d7fa8a0c4
+size 117440512
diff --git a/params_shard_60.bin b/params_shard_60.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6f63b5f1f818869f0604a1830b9edd3fb96e1f1a
--- /dev/null
+++ b/params_shard_60.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b10f26c9c2337ee1ce5a3b289f743fd42b6621964729584445a615c25fdbf824
+size 24150016
diff --git a/params_shard_61.bin b/params_shard_61.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5034c87cef433f2f297aba9bfe5edca249d32c8c
--- /dev/null
+++ b/params_shard_61.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:114c980ea103c5e58fd2e6277acc4a65f4c901923c9f6013b9f5df14e2e6b91c
+size 41943040
diff --git a/params_shard_62.bin b/params_shard_62.bin
new file mode 100644
index 0000000000000000000000000000000000000000..918b0b2e677b898666c807c0e0485c8502d6f633
--- /dev/null
+++ b/params_shard_62.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:86825a57b87027f2664a505be23bfcac3018384686d218e9f34978e4d1a86424
+size 33554432
diff --git a/params_shard_63.bin b/params_shard_63.bin
new file mode 100644
index 0000000000000000000000000000000000000000..801560ad84f66004582e1100581d34a8d5c8ec9d
--- /dev/null
+++ b/params_shard_63.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:28c72845c5d1c353c682bb4612e47f70cef2cf67f0d5d3454de3f64bb7f28fa7
+size 234881024
diff --git a/params_shard_64.bin b/params_shard_64.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d75635ab13d35e74b9072a4f417a47d41265a011
--- /dev/null
+++ b/params_shard_64.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:719a96093ad97a98473ae49f047aa06a395022d3d34a1521b921e3e2c8f2ca5d
+size 29360128
diff --git a/params_shard_65.bin b/params_shard_65.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a60cb356aba0bc1fe09ebf9720810af1ddedc885
--- /dev/null
+++ b/params_shard_65.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bc44b874a28a2ebba65cc75fe2efebd485baa407a9b124f761c8af2592e8d936
+size 117440512
diff --git a/params_shard_66.bin b/params_shard_66.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f752b6391fad0c4ea79a9260dbbf903cf9972b95
--- /dev/null
+++ b/params_shard_66.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:edded2858dc69b86acc5d33e3f375c8e04ede68e52248e4443d3bffa09634d97
+size 24150016
diff --git a/params_shard_67.bin b/params_shard_67.bin
new file mode 100644
index 0000000000000000000000000000000000000000..18bd570f39a313aba7e341985eaebf76259eb753
--- /dev/null
+++ b/params_shard_67.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af7428d4c1cbe00b4875f6a63e04d74d2eff3638201a83f233d8e53f88806000
+size 41943040
diff --git a/params_shard_68.bin b/params_shard_68.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7925705a1edd5eb51eeec8bada52a72a375a59fc
--- /dev/null
+++ b/params_shard_68.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a0c12458e4d9031fbfc6a2c22ad0b52763b5386273b45c9d01540451e58f11e0
+size 33554432
diff --git a/params_shard_69.bin b/params_shard_69.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5a5b50bb87a8afeb8a4983efabe0ded3fa46ff3f
--- /dev/null
+++ b/params_shard_69.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b170c742b9954bfe32846776e9d76fa980cedfed85cc3737898615b6d273a1ea
+size 234881024
diff --git a/params_shard_7.bin b/params_shard_7.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a8fb2899cfdc154a21fb13c031f33007a64079b4
--- /dev/null
+++ b/params_shard_7.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a75085aefd4f46886e0933768aafcbeab42589324b10c310e0c03ff57c542b50
+size 41943040
diff --git a/params_shard_70.bin b/params_shard_70.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cd6d299cda872be429160b1057522004d7414ae6
--- /dev/null
+++ b/params_shard_70.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:896c551f614e5a1a1c2699bac72a6537bfa774a2bda876422fa667a69c8de1e4
+size 29360128
diff --git a/params_shard_71.bin b/params_shard_71.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bb3f57ede6a09a39c1a4b73b86bd8e03973f6175
--- /dev/null
+++ b/params_shard_71.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1eee2f0230a238d1d28a15d63eddf793ded60e77aae4605608a893b92f4c010b
+size 117440512
diff --git a/params_shard_72.bin b/params_shard_72.bin
new file mode 100644
index 0000000000000000000000000000000000000000..60669df524e5483678eddf0035095342ef4a3c1e
--- /dev/null
+++ b/params_shard_72.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f6654a3ba434ccd1f4bcc881cbc67b18f21aeaad5d1265a8ff74e0ba257d270c
+size 24150016
diff --git a/params_shard_73.bin b/params_shard_73.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e36a82a04034074438c838aaf8c609cb9acbce53
--- /dev/null
+++ b/params_shard_73.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:644629e98cc066e5ed4b22d0e78ea7e35532727f8c6010809452ec0a8b61ef7c
+size 41943040
diff --git a/params_shard_74.bin b/params_shard_74.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3027f52513b396063a9c59dda6804bacb32c21e4
--- /dev/null
+++ b/params_shard_74.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2a08dfc92cf12bbbb0c31aca07c3b137c0f365d33634b35725197f84e0ef7062
+size 33554432
diff --git a/params_shard_75.bin b/params_shard_75.bin
new file mode 100644
index 0000000000000000000000000000000000000000..700204a7a0ea088b8352cd5decdce9f18bf362e0
--- /dev/null
+++ b/params_shard_75.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7443716e7115eabf72a7cc4fd668ade437df81f44447d98f224afa451bb2133f
+size 234881024
diff --git a/params_shard_76.bin b/params_shard_76.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6672cc1058038d3e23bdcb9069a42990a57380cc
--- /dev/null
+++ b/params_shard_76.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df096f51c953b5f4e1b2eddb4b0a3a54d9a6cc4d5265dd055517a89e6c144086
+size 29360128
diff --git a/params_shard_77.bin b/params_shard_77.bin
new file mode 100644
index 0000000000000000000000000000000000000000..451ee9e7fce6d1810c5dc6ddcf4cb36d0b8cbfdd
--- /dev/null
+++ b/params_shard_77.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0b39703e503efac03a2297d2dc95d8cd0c3d467454a91d0cb9b3f83dfe555586
+size 117440512
diff --git a/params_shard_78.bin b/params_shard_78.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a6fd10a46ee4e8842f054f0ca94b1287689b149e
--- /dev/null
+++ b/params_shard_78.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ea304ffbd0a6f8f6558232e353adef8e0b3204882afa5282dd5b4167ecbd619f
+size 24150016
diff --git a/params_shard_79.bin b/params_shard_79.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fe790d8d8ee817aabd411b73d4a937824f9f9322
--- /dev/null
+++ b/params_shard_79.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e6a1de083c2fdcc627f8f2840c61d16993ad7d150f5b77fa3c333cb151ba7c64
+size 41943040
diff --git a/params_shard_8.bin b/params_shard_8.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ab630734d195c50bdbdcd02c3082e378c73297b2
--- /dev/null
+++ b/params_shard_8.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d0e6a1eb72fcc4c38d4c0466ef94f5dcb1e054e04646ffcfbea81a1694223b8
+size 33554432
diff --git a/params_shard_80.bin b/params_shard_80.bin
new file mode 100644
index 0000000000000000000000000000000000000000..26ce301e307971743425eceb29f4410574738efd
--- /dev/null
+++ b/params_shard_80.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d396c5542e510746a9cef675719ebdfa1f263bb92f9f37b0d1b8cdd2996e2d3b
+size 33554432
diff --git a/params_shard_81.bin b/params_shard_81.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4f566b02a3f9afdb98446a8c2029d07ffd0837e6
--- /dev/null
+++ b/params_shard_81.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b111f52531cff83002cd95b5449c52f785e0abbf5fd705d38535f85e7f3b7e5
+size 234881024
diff --git a/params_shard_82.bin b/params_shard_82.bin
new file mode 100644
index 0000000000000000000000000000000000000000..026662e492f3c3f685ee2908e9fe222a9f17bfa1
--- /dev/null
+++ b/params_shard_82.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f37c688929ed9a7311a594bc9e24be19a918e1f0771050dda0b561807a242afc
+size 29360128
diff --git a/params_shard_83.bin b/params_shard_83.bin
new file mode 100644
index 0000000000000000000000000000000000000000..34e79f34b3c5b2c62a46312d52e903459d76e562
--- /dev/null
+++ b/params_shard_83.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c79b6245af195e890ba6816d8abf621aaf4117474361154aa58e0f04646b2b17
+size 117440512
diff --git a/params_shard_84.bin b/params_shard_84.bin
new file mode 100644
index 0000000000000000000000000000000000000000..07f2759510928a27b8f64c7a3c028a2fd7e8e200
--- /dev/null
+++ b/params_shard_84.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5ac39d5f13524aa7be8a002f7de88808ca82e4a76f966700cbed3c316b6071d7
+size 24150016
diff --git a/params_shard_85.bin b/params_shard_85.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0c54e403d5c6deaae9622668565a635f192d06df
--- /dev/null
+++ b/params_shard_85.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6f3bcd9a9a0744d154c09816391fb3ecf343f6f1c54e34c498351c0ffb5bc48e
+size 41943040
diff --git a/params_shard_86.bin b/params_shard_86.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3f7097aaee11357f64e8a3afe5554f5f291b70b7
--- /dev/null
+++ b/params_shard_86.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2c35949ba378b41096b6120c7b0c1533992406dbc6d34fb2b727106f2b6b517c
+size 33554432
diff --git a/params_shard_87.bin b/params_shard_87.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7a7d55128c527593b18dd607b6bca919845cc65d
--- /dev/null
+++ b/params_shard_87.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dd4a323c39852a891d784a998f208dee464d0f23e6fbf0b370bafec69cd4a37c
+size 234881024
diff --git a/params_shard_88.bin b/params_shard_88.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f121dd7354afeb4b169f838adb9e9c9e5ce7e369
--- /dev/null
+++ b/params_shard_88.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:91abff9c2d76bf8f9440f6cbb2f75644c8d703216f1bbd5aec696e8640d1c3d4
+size 29360128
diff --git a/params_shard_89.bin b/params_shard_89.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0b189a694e8fb75d76395d82eab1313cafa6a70f
--- /dev/null
+++ b/params_shard_89.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:63bc1c27e03301557d04e8a7ef1a76e160de60a879cb0899509efe9f1cb1a792
+size 117440512
diff --git a/params_shard_9.bin b/params_shard_9.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4b4b83497d04b43e775d11a859f578d09f746ca8
--- /dev/null
+++ b/params_shard_9.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c9ae1d6dc1aed583a56c4338f13c051ddc65951bd9d02b0bba5a40ba4379921b
+size 29392896
diff --git a/params_shard_90.bin b/params_shard_90.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dd26de41ca33f1852d6244e781453d8ec1b73163
--- /dev/null
+++ b/params_shard_90.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf1c5782295a0d974981113d28d831eb993da47005974dfce00d1ebdad592b15
+size 24150016
diff --git a/params_shard_91.bin b/params_shard_91.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5f45012e66717aa05cda5fadd1cf3f7544b9db84
--- /dev/null
+++ b/params_shard_91.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:18f47aaa353cd55e05d3cdb8de4e63ef63108634772ef87f2a99452fdfe6d19b
+size 41943040
diff --git a/params_shard_92.bin b/params_shard_92.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fd51ce8fd1d1cb3eb889af23878a9c8ffd0c864c
--- /dev/null
+++ b/params_shard_92.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:81f38fa2f246e91bc8204bd12d9333003a6b77e1fe1e9cd1cf44a8a47e39f7c5
+size 33554432
diff --git a/params_shard_93.bin b/params_shard_93.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b3773d5bc3d9895c41af4f9328bb2bb7e749e59
--- /dev/null
+++ b/params_shard_93.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4be8bc70a664d2a497ab77feb5300aeed8d79d0d24057f8b1729145234526b36
+size 234881024
diff --git a/params_shard_94.bin b/params_shard_94.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7337ef4031cb1f38e2a29f06ed0ae4b9da25c4e2
--- /dev/null
+++ b/params_shard_94.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c9981cb251b5dfb52065db9f6bba5f2e0dc32ba94ff5bf4f26cec1d8fd1e6c79
+size 29360128
diff --git a/params_shard_95.bin b/params_shard_95.bin
new file mode 100644
index 0000000000000000000000000000000000000000..63cad2930923c393fffa2ad711b827a75be2145b
--- /dev/null
+++ b/params_shard_95.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b79caaf4d894e7c0b08675bb1b5da3fb28cfdfe4caec4b2c99b30487e4f9e4fc
+size 117440512
diff --git a/params_shard_96.bin b/params_shard_96.bin
new file mode 100644
index 0000000000000000000000000000000000000000..582075f68dea8a5d021f680c20999840f426e1c1
--- /dev/null
+++ b/params_shard_96.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:50aba95cc38249a5bc0b35c4c7fb140778e70016cd45a94fd8ddfdeba507b6b8
+size 24150016
diff --git a/params_shard_97.bin b/params_shard_97.bin
new file mode 100644
index 0000000000000000000000000000000000000000..92192e5684155ae172f47f9dec421894803179d1
--- /dev/null
+++ b/params_shard_97.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bfb832f7db746596ceba9fb38b06f4f76f4403e61d4a89aa81a7f8b357086e4a
+size 41943040
diff --git a/params_shard_98.bin b/params_shard_98.bin
new file mode 100644
index 0000000000000000000000000000000000000000..714762c6e21bfe234865e8bbb7cdcd718c0f113f
--- /dev/null
+++ b/params_shard_98.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b53b93d3a8a32730af385b6fef83d48bf32322244a26d3d2bebd57ac86a9402e
+size 33554432
diff --git a/params_shard_99.bin b/params_shard_99.bin
new file mode 100644
index 0000000000000000000000000000000000000000..665eb0e551d0fa029d6af1cc13daa8eb0d73ebcb
--- /dev/null
+++ b/params_shard_99.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c78ef65f11d79a70464057bd37d60a164b04fdbe89ffe7e247c149ac65791125
+size 234881024
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..e9c8e7a2359b81191c8021d0f3c5f28c67f20962
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,410509 @@
+{
+ "version": "1.0",
+ "truncation": null,
+ "padding": null,
+ "added_tokens": [
+ {
+ "id": 128000,
+ "content": "<|begin▁of▁sentence|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128001,
+ "content": "<|end▁of▁sentence|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128002,
+ "content": "<|reserved_special_token_0|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128003,
+ "content": "<|reserved_special_token_1|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128004,
+ "content": "<|finetune_right_pad_id|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128005,
+ "content": "<|reserved_special_token_2|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128006,
+ "content": "<|start_header_id|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128007,
+ "content": "<|end_header_id|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128008,
+ "content": "<|eom_id|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128009,
+ "content": "<|eot_id|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128010,
+ "content": "<|python_tag|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128011,
+ "content": "<|User|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": false
+ },
+ {
+ "id": 128012,
+ "content": "<|Assistant|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": false
+ },
+ {
+ "id": 128013,
+ "content": "
&": 5909, + "CON": 5910, + "Ġrepl": 5911, + "Ġregular": 5912, + "Storage": 5913, + "ramework": 5914, + "Ġgoal": 5915, + "Ġtouch": 5916, + ".widget": 5917, + "Ġbuilt": 5918, + "des": 5919, + "Part": 5920, + "(re": 5921, + "Ġworth": 5922, + "hib": 5923, + "game": 5924, + "91": 5925, + "192": 5926, + "Ġв": 5927, + "acion": 5928, + "ĠWhite": 5929, + "(type": 5930, + "(`": 5931, + "81": 5932, + "Ġnatural": 5933, + "Ġinj": 5934, + "Ġcalcul": 5935, + "ĠApril": 5936, + ".List": 5937, + "Ġassociated": 5938, + "ĉSystem": 5939, + "~~": 5940, + "=[": 5941, + "Ġstorage": 5942, + "Ġbytes": 5943, + "Ġtravel": 5944, + "Ġsou": 5945, + "Ġpassed": 5946, + "!=": 5947, + "ascript": 5948, + ".open": 5949, + "Ġgrid": 5950, + "Ġbus": 5951, + "Ġrecogn": 5952, + "Ab": 5953, + "Ġhon": 5954, + "ĠCenter": 5955, + "Ġprec": 5956, + "build": 5957, + "73": 5958, + "HTML": 5959, + "ĠSan": 5960, + "Ġcountries": 5961, + "aled": 5962, + "token": 5963, + "kt": 5964, + "Ġqual": 5965, + "Last": 5966, + "adow": 5967, + "Ġmanufact": 5968, + "idad": 5969, + "jango": 5970, + "Next": 5971, + "xf": 5972, + ".a": 5973, + "Ġporno": 5974, + "ĠPM": 5975, + "erve": 5976, + "iting": 5977, + "_th": 5978, + "ci": 5979, + "=None": 5980, + "gs": 5981, + "Ġlogin": 5982, + "atives": 5983, + "']);Ċ": 5984, + "Äħ": 5985, + "Ġill": 5986, + "IA": 5987, + "children": 5988, + "DO": 5989, + "Ġlevels": 5990, + "Ġ{{": 5991, + "Ġlooks": 5992, + "Ġ\"#": 5993, + "ToString": 5994, + "Ġnecessary": 5995, + "ĠĠĠĊ": 5996, + "cell": 5997, + "Entry": 5998, + "Ġ'#": 5999, + "Ġextrem": 6000, + "Selector": 6001, + "Ġplaceholder": 6002, + "Load": 6003, + "Ġreleased": 6004, + "ORE": 6005, + "Enumer": 6006, + "ĠTV": 6007, + "SET": 6008, + "inq": 6009, + "Press": 6010, + "ĠDepartment": 6011, + "Ġproperties": 6012, + "Ġrespond": 6013, + "Search": 6014, + "ael": 6015, + "Ġrequ": 6016, + "ĠBook": 6017, + "/Ċ": 6018, + "(st": 6019, + "Ġfinancial": 6020, + "icket": 6021, + "_input": 6022, + "Ġthreat": 6023, + "(in": 6024, + "Strip": 6025, + "ìĿ": 6026, 
+ "ção": 6027, + "71": 6028, + "Ġevidence": 6029, + "));": 6030, + "ĠBro": 6031, + "Ġ[];Ċ": 6032, + "Ġou": 6033, + "buf": 6034, + "Script": 6035, + "dat": 6036, + "Ġrule": 6037, + "#import": 6038, + "=\"/": 6039, + "Serial": 6040, + "Ġstarting": 6041, + "[index": 6042, + "ae": 6043, + "Ġcontrib": 6044, + "session": 6045, + "_new": 6046, + "utable": 6047, + "ober": 6048, + "Ġ\"./": 6049, + "Ġlogger": 6050, + "Ġrecently": 6051, + "Ġreturned": 6052, + "ččĊ": 6053, + ")))Ċ": 6054, + "itions": 6055, + "Ġseek": 6056, + "Ġcommunic": 6057, + "Ġ\".": 6058, + "Ġusername": 6059, + "ECT": 6060, + "DS": 6061, + "Ġotherwise": 6062, + "ĠGerman": 6063, + ".aw": 6064, + "Adapter": 6065, + "ixel": 6066, + "Ġsystems": 6067, + "Ġdrop": 6068, + "83": 6069, + "Ġstructure": 6070, + "Ġ$(\"#": 6071, + "encies": 6072, + "anning": 6073, + "ĠLink": 6074, + "ĠResponse": 6075, + "Ġstri": 6076, + "ż": 6077, + "ĠDB": 6078, + "æĹ": 6079, + "android": 6080, + "submit": 6081, + "otion": 6082, + "92": 6083, + "(@": 6084, + ".test": 6085, + "82": 6086, + "ĊĊĊĊĊĊĊĊ": 6087, + "];čĊ": 6088, + "Ġdirectly": 6089, + "Ġ\"%": 6090, + "ris": 6091, + "elta": 6092, + "AIL": 6093, + "){čĊ": 6094, + "mine": 6095, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 6096, + "(k": 6097, + "bon": 6098, + "asic": 6099, + "pite": 6100, + "___": 6101, + "Max": 6102, + "Ġerrors": 6103, + "ĠWhile": 6104, + "Ġarguments": 6105, + "Ġensure": 6106, + "Right": 6107, + "-based": 6108, + "Web": 6109, + "Ġ-=": 6110, + "Ġintrodu": 6111, + "ĠInst": 6112, + "ĠWash": 6113, + "ordin": 6114, + "join": 6115, + "Database": 6116, + "Ġgrad": 6117, + "Ġusually": 6118, + "ITE": 6119, + "Props": 6120, + "?>Ċ": 6121, + "ĠGo": 6122, + "@Override": 6123, + "REF": 6124, + "Ġip": 6125, + "ĠAustral": 6126, + "Ġist": 6127, + "ViewById": 6128, + "Ġserious": 6129, + "Ġcustomer": 6130, + ".prototype": 6131, + "odo": 6132, + "cor": 6133, + "Ġdoor": 6134, + "ĠWITHOUT": 6135, + "Ġplant": 6136, + "Ġbegan": 6137, + "Ġdistance": 6138, + "()).": 6139, + "Ġchance": 6140, + "Ġord": 
6141, + "came": 6142, + "pragma": 6143, + "Ġprotect": 6144, + "ragment": 6145, + "ĠNode": 6146, + "ening": 6147, + "Ñĩ": 6148, + "Ġroute": 6149, + "ĠSchool": 6150, + "hi": 6151, + "Ġneighb": 6152, + "After": 6153, + "licit": 6154, + "Ġcontr": 6155, + "Ġprimary": 6156, + "AA": 6157, + ".WriteLine": 6158, + "utils": 6159, + "Ġbi": 6160, + "Red": 6161, + ".Linq": 6162, + ".object": 6163, + "Ġleaders": 6164, + "unities": 6165, + "Ġgun": 6166, + "onth": 6167, + "ĠDev": 6168, + "FILE": 6169, + "Ġcomments": 6170, + "_len": 6171, + "arrow": 6172, + "amount": 6173, + "Range": 6174, + "sert": 6175, + "GridView": 6176, + "Ġupdated": 6177, + "ĠMo": 6178, + "Ġinform": 6179, + "ociety": 6180, + "ala": 6181, + "Access": 6182, + "Ġhab": 6183, + "Ġcreat": 6184, + "_arg": 6185, + "ĠJanuary": 6186, + "ĠDay": 6187, + "\")čĊ": 6188, + "uple": 6189, + "document": 6190, + "gorith": 6191, + "menu": 6192, + "ĠOver": 6193, + "bb": 6194, + ".title": 6195, + "_out": 6196, + "Ġled": 6197, + "uri": 6198, + "Ġ?>": 6199, + "gl": 6200, + "Ġbank": 6201, + "ayment": 6202, + "ĉprintf": 6203, + "MD": 6204, + "Ġsample": 6205, + "Ġhands": 6206, + "ĠVersion": 6207, + "uario": 6208, + "Ġoffers": 6209, + "ityEngine": 6210, + "Ġshape": 6211, + "Ġsleep": 6212, + "_point": 6213, + "Settings": 6214, + "Ġachie": 6215, + "Ġsold": 6216, + "ota": 6217, + ".bind": 6218, + "Am": 6219, + "Ġsafe": 6220, + "Store": 6221, + "Ġshared": 6222, + "Ġpriv": 6223, + "_VAL": 6224, + "Ġsens": 6225, + "){": 6226, + "Ġremember": 6227, + "shared": 6228, + "element": 6229, + "Ġshoot": 6230, + "Vert": 6231, + "cout": 6232, + "Ġenv": 6233, + "_label": 6234, + "Ġ>Ċ": 6235, + "run": 6236, + "Ġscene": 6237, + "(array": 6238, + "device": 6239, + "_title": 6240, + "agon": 6241, + "]čĊ": 6242, + "aby": 6243, + "Ġbecame": 6244, + "boolean": 6245, + "Ġpark": 6246, + "ĠCode": 6247, + "upload": 6248, + "riday": 6249, + "ĠSeptember": 6250, + "Fe": 6251, + "Ġsen": 6252, + "cing": 6253, + "FL": 6254, + "Col": 6255, + "uts": 6256, + "_page": 6257, 
+ "inn": 6258, + "Ġimplied": 6259, + "aling": 6260, + "Ġyourself": 6261, + ".Count": 6262, + "conf": 6263, + "Ġaud": 6264, + "_init": 6265, + ".)": 6266, + "Ġwrote": 6267, + "003": 6268, + "NG": 6269, + ".Error": 6270, + "ä»": 6271, + ".for": 6272, + "Ġequal": 6273, + "ĠRequest": 6274, + "Ġserial": 6275, + "Ġallows": 6276, + "XX": 6277, + "Ġmiddle": 6278, + "chor": 6279, + "195": 6280, + "94": 6281, + "ø": 6282, + "erval": 6283, + ".Column": 6284, + "reading": 6285, + "Ġescort": 6286, + "ĠAugust": 6287, + "Ġquickly": 6288, + "Ġweap": 6289, + "ĠCG": 6290, + "ropri": 6291, + "ho": 6292, + "Ġcop": 6293, + "(struct": 6294, + "ĠBig": 6295, + "Ġvs": 6296, + "Ġfrequ": 6297, + ".Value": 6298, + "Ġactions": 6299, + "Ġproper": 6300, + "Ġinn": 6301, + "Ġobjects": 6302, + "Ġmatrix": 6303, + "avascript": 6304, + "Ġones": 6305, + ".group": 6306, + "Ġgreen": 6307, + "Ġpaint": 6308, + "ools": 6309, + "ycl": 6310, + "encode": 6311, + "olt": 6312, + "comment": 6313, + ".api": 6314, + "Dir": 6315, + "Ġune": 6316, + "izont": 6317, + ".position": 6318, + "Ġdesigned": 6319, + "_val": 6320, + "avi": 6321, + "iring": 6322, + "tab": 6323, + "Ġlayer": 6324, + "Ġviews": 6325, + "Ġreve": 6326, + "rael": 6327, + "ĠON": 6328, + "rics": 6329, + "160": 6330, + "np": 6331, + "Ġcore": 6332, + "());čĊ": 6333, + "Main": 6334, + "Ġexpert": 6335, + "ĉĉčĊ": 6336, + "_en": 6337, + "Ġ/>": 6338, + "utter": 6339, + "IAL": 6340, + "ails": 6341, + "ĠKing": 6342, + "*/ĊĊ": 6343, + "ĠMet": 6344, + "_end": 6345, + "addr": 6346, + "ora": 6347, + "Ġir": 6348, + "Min": 6349, + "Ġsurpr": 6350, + "Ġrepe": 6351, + "Ġdirectory": 6352, + "PUT": 6353, + "-S": 6354, + "Ġelection": 6355, + "haps": 6356, + ".pre": 6357, + "cm": 6358, + "Values": 6359, + "Ġ\"Ċ": 6360, + "column": 6361, + "ivil": 6362, + "Login": 6363, + "inue": 6364, + "93": 6365, + "Ġbeautiful": 6366, + "Ġsecret": 6367, + "(event": 6368, + "Ġchat": 6369, + "ums": 6370, + "Ġorigin": 6371, + "Ġeffects": 6372, + "Ġmanagement": 6373, + "illa": 6374, + "tk": 
6375, + "Ġsetting": 6376, + "ĠCour": 6377, + "Ġmassage": 6378, + "ĉend": 6379, + "Ġhappy": 6380, + "Ġfinish": 6381, + "Ġcamera": 6382, + "ĠVer": 6383, + "ĠDemocr": 6384, + "ĠHer": 6385, + "(Q": 6386, + "cons": 6387, + "ita": 6388, + "Ġ'.": 6389, + "{}": 6390, + "ĉC": 6391, + "Ġstuff": 6392, + "194": 6393, + "Ġ:Ċ": 6394, + "ĠAR": 6395, + "Task": 6396, + "hidden": 6397, + "eros": 6398, + "IGN": 6399, + "atio": 6400, + "ĠHealth": 6401, + "olute": 6402, + "Enter": 6403, + "'>": 6404, + "ĠTwitter": 6405, + "ĠCounty": 6406, + "scribe": 6407, + "Ġ=>Ċ": 6408, + "Ġhy": 6409, + "fit": 6410, + "Ġmilitary": 6411, + "Ġsale": 6412, + "required": 6413, + "non": 6414, + "bootstrap": 6415, + "hold": 6416, + "rim": 6417, + "-old": 6418, + "ĠDown": 6419, + "Ġmention": 6420, + "contact": 6421, + "_group": 6422, + "oday": 6423, + "Ġtown": 6424, + "Ġsolution": 6425, + "uate": 6426, + "elling": 6427, + "]->": 6428, + "otes": 6429, + "ental": 6430, + "omen": 6431, + "ospital": 6432, + "ĠSup": 6433, + "_EN": 6434, + "Ġslow": 6435, + "SESSION": 6436, + "Ġblue": 6437, + "ago": 6438, + "Ġlives": 6439, + "Ġ^": 6440, + ".un": 6441, + "inst": 6442, + "enge": 6443, + "Ġcustomers": 6444, + "Ġcast": 6445, + "udget": 6446, + "ï¼ģ": 6447, + "icens": 6448, + "Ġdetermin": 6449, + "Selected": 6450, + "_pl": 6451, + "ueue": 6452, + "Ġdark": 6453, + "//ĊĊ": 6454, + "si": 6455, + "thern": 6456, + "ĠJapan": 6457, + "/w": 6458, + "PU": 6459, + "ĠEast": 6460, + "ovie": 6461, + "Ġpackage": 6462, + "Ġnor": 6463, + "Ġapi": 6464, + "bot": 6465, + "\"];Ċ": 6466, + "_post": 6467, + "ulate": 6468, + "Ġclub": 6469, + "'));Ċ": 6470, + "Ġloop": 6471, + "PIO": 6472, + "ione": 6473, + "shot": 6474, + "Initial": 6475, + "Ġplayed": 6476, + "register": 6477, + "rought": 6478, + "_max": 6479, + "acement": 6480, + "match": 6481, + "raphics": 6482, + "AST": 6483, + "Ġexisting": 6484, + "Ġcomplex": 6485, + "DA": 6486, + ".Ch": 6487, + ".common": 6488, + "mo": 6489, + "Ġ'../../": 6490, + "ito": 6491, + "Ġanalysis": 6492, + 
"Ġdeliver": 6493, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 6494, + "idx": 6495, + "Ãł": 6496, + "ongo": 6497, + "ĠEnglish": 6498, + "Ċ": 10197, + "_default": 10198, + "ĠDatabase": 10199, + "rep": 10200, + "ESS": 10201, + "nergy": 10202, + ".Find": 10203, + "_mask": 10204, + "Ġrise": 10205, + "Ġkernel": 10206, + "::$": 10207, + ".Q": 10208, + "Ġoffering": 10209, + "decl": 10210, + "ĠCS": 10211, + "Ġlisted": 10212, + "Ġmostly": 10213, + "enger": 10214, + "Ġblocks": 10215, + "olo": 10216, + "Ġgoverning": 10217, + "\\F": 10218, + "Ġconcent": 10219, + ".getText": 10220, + "Ġmb": 10221, + "Ġoccurred": 10222, + "Ġchanging": 10223, + "Scene": 10224, + "_CODE": 10225, + "Beh": 10226, + "\"The": 10227, + "Ġtile": 10228, + "ĠAssociation": 10229, + "ĉP": 10230, + "alty": 10231, + "_ad": 10232, + "odies": 10233, + "iated": 10234, + "Ġprepared": 10235, + "possible": 10236, + "Ġmort": 10237, + "TEST": 10238, + "142": 10239, + "Ġignore": 10240, + "Ġcalc": 10241, + "Ġrs": 10242, + "ĠassertEquals": 10243, + "Ġsz": 10244, + "ĠTHIS": 10245, + ".\"Ċ": 10246, + "Ġcanvas": 10247, + "java": 10248, + "Ġdut": 10249, + "VALID": 10250, + ".sql": 10251, + ".input": 10252, + "Ġaux": 10253, + "Sup": 10254, + "Ġartist": 10255, + "Vec": 10256, + "_TIME": 10257, + ".stringify": 10258, + "etween": 10259, + "ĠCategory": 10260, + "Ġ[-": 10261, + "ĠDevExpress": 10262, + "ĠJul": 10263, + "Ġring": 10264, + ".ed": 10265, + "YY": 10266, + "Let": 10267, + "TextField": 10268, + "Ġflat": 10269, + "_print": 10270, + "ĠOTHER": 10271, + "adian": 10272, + "Ġchecked": 10273, + "ele": 10274, + "Align": 10275, + "standing": 10276, + "Ġ[],": 10277, + "Ġlab": 10278, + "ucky": 10279, + "ĠChristmas": 10280, + "(image": 10281, + ".module": 10282, + "Ġlots": 10283, + "Ġslightly": 10284, + "(final": 10285, + "erge": 10286, + "è¿": 10287, + "147": 10288, + "ĠPolice": 10289, + "143": 10290, + "ĠRight": 10291, + "Ġaward": 10292, + "ĠOS": 10293, + "Ġ{}ĊĊ": 10294, + "Ġptr": 10295, + "oves": 10296, + "icated": 10297, + "ем": 10298, + "Ġmanage": 
10299, + "oliday": 10300, + "Amount": 10301, + "oolStrip": 10302, + "tbody": 10303, + "Nav": 10304, + "wrap": 10305, + "BB": 10306, + "Ġwatching": 10307, + "arios": 10308, + "Ġoptional": 10309, + "_K": 10310, + "ĠLicensed": 10311, + ".Map": 10312, + "Timer": 10313, + "ĠAP": 10314, + "ĠRev": 10315, + "(o": 10316, + ",c": 10317, + "umin": 10318, + "etailed": 10319, + "ĠHy": 10320, + "Ġblank": 10321, + "agger": 10322, + "ĠSelf": 10323, + "()[": 10324, + ".make": 10325, + "earn": 10326, + "channel": 10327, + ";Ċ": 10342, + "World": 10343, + "Ġpython": 10344, + "Ġlif": 10345, + "Ġtrav": 10346, + "Ġconven": 10347, + "company": 10348, + "ĠClub": 10349, + "138": 10350, + "Ver": 10351, + "Btn": 10352, + "Ġzone": 10353, + "products": 10354, + "ĠEduc": 10355, + "Ġverify": 10356, + "ĠMil": 10357, + "ono": 10358, + "]);ĊĊ": 10359, + "ENCE": 10360, + "Ġpacket": 10361, + "Ġcer": 10362, + "Ġenumer": 10363, + "Ġpars": 10364, + "formed": 10365, + "Ġoccup": 10366, + "tre": 10367, + "Ġexercise": 10368, + "Day": 10369, + "_sum": 10370, + "Ġasking": 10371, + "aption": 10372, + "Ġorders": 10373, + "Ġspending": 10374, + "ĠERR": 10375, + ".Dis": 10376, + "ĠUtil": 10377, + "âĢľI": 10378, + "\\'": 10379, + "?)": 10380, + "/>Ċ": 10381, + "Ġemot": 10382, + "Ġinfluence": 10383, + "ĠAfrica": 10384, + "atters": 10385, + "Ùħ": 10386, + ".session": 10387, + "Ġchief": 10388, + "ĉĉĉĉĉĉĉĉĉĉĉ": 10389, + "Ġtom": 10390, + "cluded": 10391, + "serial": 10392, + "_handler": 10393, + ".Type": 10394, + "aped": 10395, + "Ġpolicies": 10396, + "-ex": 10397, + "-tr": 10398, + "blank": 10399, + "merce": 10400, + "Ġcoverage": 10401, + "Ġrc": 10402, + "_matrix": 10403, + "_box": 10404, + "Ġcharges": 10405, + "ĠBoston": 10406, + "Pe": 10407, + "Ġcircum": 10408, + "Ġfilled": 10409, + "148": 10410, + "Ġnorth": 10411, + "ictureBox": 10412, + "ĉres": 10413, + "è®": 10414, + "Ġtermin": 10415, + "Ġ[âĢ¦": 10416, + "IRECT": 10417, + "Ġber": 10418, + "Ġ\"../../": 10419, + "retch": 10420, + ".code": 10421, + "_col": 10422, + 
"ĠGovernment": 10423, + "Ġargv": 10424, + "ĠLord": 10425, + "asi": 10426, + "Exec": 10427, + "ĉlet": 10428, + "vertis": 10429, + "Ġdiscussion": 10430, + "enance": 10431, + "outube": 10432, + "typeof": 10433, + "Ġserved": 10434, + "ĠPut": 10435, + "ĉx": 10436, + "Ġsweet": 10437, + "Before": 10438, + "ategy": 10439, + ".of": 10440, + "ĠMaterial": 10441, + "Sort": 10442, + "ONT": 10443, + "igital": 10444, + "Why": 10445, + "Ġsust": 10446, + "Ġç": 10447, + "abet": 10448, + "Ġsegment": 10449, + "Ġ[],Ċ": 10450, + "ĠMuslim": 10451, + "ĠfindViewById": 10452, + "cut": 10453, + "_TEXT": 10454, + "ĠMary": 10455, + "Ġloved": 10456, + "Ġlie": 10457, + "ĠJO": 10458, + "Ġisset": 10459, + "month": 10460, + "Ġprime": 10461, + "ti": 10462, + "ĠCarol": 10463, + "Use": 10464, + "146": 10465, + "ĠPop": 10466, + "ĠSave": 10467, + "Interval": 10468, + "execute": 10469, + "dy": 10470, + "ĠIran": 10471, + "_cont": 10472, + "ĉT": 10473, + "Ġphase": 10474, + "checkbox": 10475, + "week": 10476, + "Ġhide": 10477, + "Ġtil": 10478, + "Ġju": 10479, + "Custom": 10480, + "burg": 10481, + "/M": 10482, + "TON": 10483, + "Ġquant": 10484, + "Ġrub": 10485, + "ixels": 10486, + "Ġinstalled": 10487, + "Ġdump": 10488, + "Ġproperly": 10489, + "(List": 10490, + "Ġdecide": 10491, + "apply": 10492, + "Has": 10493, + "Ġkeeping": 10494, + "Ġcitizens": 10495, + "Ġjoint": 10496, + "pool": 10497, + "Socket": 10498, + "_op": 10499, + "Ġweapon": 10500, + "gnore": 10501, + "ĠExec": 10502, + "otten": 10503, + "ĠMS": 10504, + "Ġ(-": 10505, + "ĠReview": 10506, + "Ġexamples": 10507, + "Ġtight": 10508, + "!(": 10509, + "DP": 10510, + "ĠMessageBox": 10511, + "Ġphotograph": 10512, + "164": 10513, + "URI": 10514, + "ét": 10515, + "low": 10516, + "ĠGrand": 10517, + ".persistence": 10518, + "Ġmaintain": 10519, + "Ġnums": 10520, + "Ġzip": 10521, + "ials": 10522, + "ĠGets": 10523, + "peg": 10524, + "ĠBuffer": 10525, + "~~~~": 10526, + "rastructure": 10527, + "ĠPL": 10528, + "uen": 10529, + "obby": 10530, + "sizeof": 10531, + 
"Ġpic": 10532, + "Ġseed": 10533, + "Ġexperienced": 10534, + "Ġodd": 10535, + "Ġkick": 10536, + "Ġprocedure": 10537, + "avigator": 10538, + "-on": 10539, + ",j": 10540, + "ĠAlthough": 10541, + "ĠuserId": 10542, + "accept": 10543, + "Blue": 10544, + "IColor": 10545, + "layer": 10546, + "available": 10547, + "Ġends": 10548, + ".table": 10549, + "Ġdataset": 10550, + "bus": 10551, + "Ġexplain": 10552, + "(pro": 10553, + "ĠCommittee": 10554, + "Ġnoted": 10555, + "]:Ċ": 10556, + "Dim": 10557, + "stdio": 10558, + "154": 10559, + ".\",Ċ": 10560, + "_source": 10561, + "181": 10562, + "ĠWeek": 10563, + "ĠEdge": 10564, + "Ġoperating": 10565, + "Ġeste": 10566, + "ipl": 10567, + "330": 10568, + "agination": 10569, + "Ġproceed": 10570, + "Ġanimation": 10571, + ".Models": 10572, + "ĠWatch": 10573, + "iat": 10574, + "Ġoppon": 10575, + "/A": 10576, + "Report": 10577, + "Ġsounds": 10578, + "_buf": 10579, + "IELD": 10580, + "Ġbund": 10581, + "ĉget": 10582, + ".pr": 10583, + "(tmp": 10584, + "Ġkid": 10585, + ">ĊĊĊ": 10586, + "Ġyang": 10587, + "NotFound": 10588, + "ÑĨ": 10589, + "math": 10590, + "@gmail": 10591, + "ĠLIMIT": 10592, + "redients": 10593, + "Ġvent": 10594, + "avigate": 10595, + "Look": 10596, + "Ġreligious": 10597, + "Ġrand": 10598, + "rio": 10599, + "(GL": 10600, + "_ip": 10601, + "uan": 10602, + "iciency": 10603, + "ĠChange": 10604, + ">čĊčĊ": 10605, + "ĠEntity": 10606, + "Ġrencontre": 10607, + "ĠRet": 10608, + "plan": 10609, + "én": 10610, + "BOOL": 10611, + "uries": 10612, + "train": 10613, + "Definition": 10614, + "============": 10615, + "zz": 10616, + "450": 10617, + "Animation": 10618, + "ĠOK": 10619, + "_menu": 10620, + ".bl": 10621, + "_score": 10622, + "Ġacad": 10623, + "(System": 10624, + "Ġrefresh": 10625, + "'=>$": 10626, + ".Graphics": 10627, + "amento": 10628, + "pid": 10629, + "tc": 10630, + "Ġtips": 10631, + "Ġhomes": 10632, + "Ġfuel": 10633, + "âĸ": 10634, + "_helper": 10635, + "ĠĠčĊ": 10636, + "ĠRoom": 10637, + ".Close": 10638, + "_attr": 10639, + 
"ĠMount": 10640, + "ĠEv": 10641, + "arser": 10642, + "_top": 10643, + "eah": 10644, + "ĠDelete": 10645, + "ãĢį": 10646, + "uke": 10647, + "Ġusage": 10648, + "aria": 10649, + "_dev": 10650, + "Ġtexture": 10651, + "Ġconversation": 10652, + "eper": 10653, + "Bean": 10654, + "done": 10655, + "nonatomic": 10656, + "ĠSecond": 10657, + "Ġshooting": 10658, + "_pre": 10659, + "Components": 10660, + "Ġ]ĊĊ": 10661, + "__,": 10662, + "stitution": 10663, + ".Char": 10664, + ">();ĊĊ": 10665, + "Ġpresented": 10666, + "Ġwa": 10667, + "oker": 10668, + "-ĊĊ": 10669, + "iner": 10670, + "Ġbecoming": 10671, + "Ġincident": 10672, + "Att": 10673, + "162": 10674, + "Ġrevealed": 10675, + "forc": 10676, + "Ġboot": 10677, + ".page": 10678, + "Enumerator": 10679, + "165": 10680, + "_->": 10681, + "Photo": 10682, + "Ġspring": 10683, + ".\",": 10684, + "ĠDictionary": 10685, + "BJECT": 10686, + "Ġlocations": 10687, + "Ġsamples": 10688, + "InputStream": 10689, + "ĠBrown": 10690, + "Ġstats": 10691, + "quality": 10692, + "Ñħ": 10693, + "-dis": 10694, + "Ġhelping": 10695, + "Ġped": 10696, + "224": 10697, + "(se": 10698, + "ĠWho": 10699, + "alian": 10700, + "internal": 10701, + "Ġft": 10702, + ">().": 10703, + "->{": 10704, + "Ġmine": 10705, + "Ġsector": 10706, + "Ġgro": 10707, + "Ġopportunities": 10708, + "Ġü": 10709, + "Ġmp": 10710, + "Ġalleged": 10711, + "Ġdoubt": 10712, + "Mouse": 10713, + "About": 10714, + "_part": 10715, + "Ġchair": 10716, + "Ġstopped": 10717, + "161": 10718, + "loop": 10719, + "entities": 10720, + "Ġapps": 10721, + "ansion": 10722, + "Ġmental": 10723, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10724, + "FR": 10725, + "Ġdefend": 10726, + "care": 10727, + "Ġideal": 10728, + "/api": 10729, + "urface": 10730, + "011": 10731, + "Ġele": 10732, + "ulator": 10733, + "ĠRights": 10734, + "anguages": 10735, + "Ġfunds": 10736, + "Ġadapt": 10737, + "Attributes": 10738, + "Ġdeploy": 10739, + "opts": 10740, + "Ġvalidation": 10741, + "Ġconcerns": 10742, + "uce": 10743, + ".num": 10744, + 
"ulture": 10745, + "ila": 10746, + "Ġcup": 10747, + "Ġpure": 10748, + ".Fore": 10749, + "183": 10750, + "ĠHashMap": 10751, + ".valueOf": 10752, + "asm": 10753, + "MO": 10754, + "Ġcs": 10755, + "Ġstores": 10756, + "Ġ************************************************************************": 10757, + "Ġcommunication": 10758, + "mem": 10759, + ".EventHandler": 10760, + ".Status": 10761, + "_right": 10762, + ".setOn": 10763, + "Sheet": 10764, + "Ġidentify": 10765, + "enerated": 10766, + "ordered": 10767, + "Ġ\"[": 10768, + "Ġswe": 10769, + "Condition": 10770, + "ĠAccording": 10771, + "Ġprepare": 10772, + "Ġrob": 10773, + "Pool": 10774, + "Ġsport": 10775, + "rv": 10776, + "ĠRouter": 10777, + "Ġalternative": 10778, + "([]": 10779, + "ĠChicago": 10780, + "ipher": 10781, + "ische": 10782, + "ĠDirector": 10783, + "kl": 10784, + "ĠWil": 10785, + "keys": 10786, + "Ġmysql": 10787, + "Ġwelcome": 10788, + "king": 10789, + "ĠManager": 10790, + "Ġcaught": 10791, + ")}Ċ": 10792, + "Score": 10793, + "_PR": 10794, + "Ġsurvey": 10795, + "hab": 10796, + "Headers": 10797, + "ADER": 10798, + "Ġdecor": 10799, + "Ġturns": 10800, + "Ġradius": 10801, + "errupt": 10802, + "Cor": 10803, + "Ġmel": 10804, + "Ġintr": 10805, + "(q": 10806, + "ĠAC": 10807, + "amos": 10808, + "MAX": 10809, + "ĠGrid": 10810, + "ĠJesus": 10811, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10812, + ".DE": 10813, + "Ġts": 10814, + "Ġlinked": 10815, + "free": 10816, + "ĠQt": 10817, + "Ġ/**čĊ": 10818, + "Ġfaster": 10819, + "ctr": 10820, + "_J": 10821, + "DT": 10822, + ".Check": 10823, + "Ġcombination": 10824, + "Ġintended": 10825, + "-the": 10826, + "-type": 10827, + "182": 10828, + "ectors": 10829, + "ami": 10830, + "uting": 10831, + "Ġuma": 10832, + "XML": 10833, + "UCT": 10834, + "Ap": 10835, + "ĠRandom": 10836, + "Ġran": 10837, + ".sort": 10838, + "Ġsorted": 10839, + ".Un": 10840, + "401": 10841, + "_PER": 10842, + "itory": 10843, + "Ġpriority": 10844, + "ĠGal": 10845, + "ĠOld": 10846, + "hot": 10847, + "ĠDisplay": 10848, 
+ "(sub": 10849, + "_TH": 10850, + "_Y": 10851, + "ĠCare": 10852, + "loading": 10853, + "Kind": 10854, + "_handle": 10855, + ",,": 10856, + "rase": 10857, + "_replace": 10858, + ".addEventListener": 10859, + "ĠRT": 10860, + "172": 10861, + "Ġentered": 10862, + "gers": 10863, + "Ġich": 10864, + "(start": 10865, + "205": 10866, + "/app": 10867, + "Ġbrother": 10868, + "Memory": 10869, + "Outlet": 10870, + "Ġutf": 10871, + "prec": 10872, + "Ġnavigation": 10873, + "ORK": 10874, + "Ġdst": 10875, + "Detail": 10876, + "Ġaudience": 10877, + "Ġdur": 10878, + "Ġcluster": 10879, + "unched": 10880, + "Ġ],": 10881, + "Ġcomfortable": 10882, + ".values": 10883, + "ĠTotal": 10884, + "Ġsnap": 10885, + "Ġstandards": 10886, + "Ġperformed": 10887, + "hand": 10888, + "(\"@": 10889, + "åŃ": 10890, + "Ġphil": 10891, + "ibr": 10892, + "trim": 10893, + "Ġforget": 10894, + "157": 10895, + "Ġdoctor": 10896, + ".TextBox": 10897, + "377": 10898, + "icons": 10899, + ",s": 10900, + "ĠOp": 10901, + "Sm": 10902, + "Stop": 10903, + "ĉList": 10904, + "ĉu": 10905, + "Comment": 10906, + "_VERSION": 10907, + ".Xtra": 10908, + "Person": 10909, + "rb": 10910, + "LOB": 10911, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 10912, + "ĠCentral": 10913, + "270": 10914, + "ICK": 10915, + "raq": 10916, + "Ġputting": 10917, + "Ġmd": 10918, + "ĠLove": 10919, + "Program": 10920, + "Border": 10921, + "oor": 10922, + "Ġallowing": 10923, + "after": 10924, + "Ġentries": 10925, + "ĠMaybe": 10926, + "]).": 10927, + "ĠShort": 10928, + ")\\": 10929, + ".now": 10930, + "friend": 10931, + "Ġprefer": 10932, + "ĠGPIO": 10933, + "osis": 10934, + "ĠGameObject": 10935, + "Ġskip": 10936, + "Ġcompetition": 10937, + "_match": 10938, + "lications": 10939, + "_CONT": 10940, + ".groupBox": 10941, + "Ġals": 10942, + "666": 10943, + "\"We": 10944, + "_eq": 10945, + "lan": 10946, + "_search": 10947, + "ĠMusic": 10948, + "asis": 10949, + "Ġbind": 10950, + "ĠIsland": 10951, + "rum": 10952, + "(E": 10953, + "Ġseat": 10954, + "Video": 10955, + "Ġack": 10956, + 
"reek": 10957, + "={()": 10958, + "Ġrating": 10959, + "Ġrestaurant": 10960, + "456": 10961, + "DEX": 10962, + "(buf": 10963, + "pping": 10964, + "uality": 10965, + "Ġleague": 10966, + "176": 10967, + "Ġfocused": 10968, + "apon": 10969, + "$data": 10970, + "CLUD": 10971, + "CLUDING": 10972, + "Ġabsolute": 10973, + "(query": 10974, + "Ġtells": 10975, + "Ang": 10976, + "Ġcommunities": 10977, + "Ġhonest": 10978, + "oking": 10979, + "Ġapart": 10980, + "arity": 10981, + "/$": 10982, + "_module": 10983, + "ĠEnc": 10984, + ".an": 10985, + ".Config": 10986, + "Cre": 10987, + "Ġshock": 10988, + "ĠArab": 10989, + "IENT": 10990, + "/re": 10991, + "Ġretrie": 10992, + "ycler": 10993, + "isa": 10994, + "ĠOrgan": 10995, + ".graph": 10996, + "Ġí": 10997, + "ĠBAS": 10998, + "Enum": 10999, + "Ġpossibly": 11000, + "ÑĢаÐ": 11001, + "ĠJapanese": 11002, + "Ġcraft": 11003, + "ĠPlace": 11004, + "Ġtalent": 11005, + "Ġfunding": 11006, + "Ġconfirmed": 11007, + "Ġcycle": 11008, + "/x": 11009, + "GE": 11010, + "Ġhearing": 11011, + "Ġplants": 11012, + "Ġmouth": 11013, + "pages": 11014, + "oria": 11015, + "ĠRemove": 11016, + "_total": 11017, + "Ġod": 11018, + "ollapse": 11019, + "door": 11020, + "Ġbought": 11021, + "Ġaddr": 11022, + "ARCH": 11023, + "_dim": 11024, + "dden": 11025, + "Ġdecades": 11026, + "REQUEST": 11027, + "Ġversions": 11028, + "fire": 11029, + "006": 11030, + "Ġmoves": 11031, + "fb": 11032, + "Ġcoffee": 11033, + ".connect": 11034, + "ĠRow": 11035, + "Ġschema": 11036, + "Scope": 11037, + "-Type": 11038, + "Ġfighting": 11039, + "Ġretail": 11040, + "Ġmodified": 11041, + "TF": 11042, + "Files": 11043, + "nie": 11044, + "_command": 11045, + "stone": 11046, + "ĠÑĤ": 11047, + "_thread": 11048, + "Ġbond": 11049, + "ĠDevelopment": 11050, + "Ġpt": 11051, + "FORM": 11052, + "plet": 11053, + "Ġidentified": 11054, + "cpp": 11055, + "206": 11056, + "225": 11057, + "Ġcoding": 11058, + "oked": 11059, + "ĠMaster": 11060, + "IDTH": 11061, + "Ġresidents": 11062, + "redit": 11063, + "ĠPhoto": 
11064, + "=-": 11065, + "unte": 11066, + "ateur": 11067, + "159": 11068, + "_STATE": 11069, + "ĠSing": 11070, + "Ġsheet": 11071, + ".val": 11072, + "orse": 11073, + "Ġhers": 11074, + "Ġdetermined": 11075, + "Common": 11076, + "Ġwed": 11077, + "_queue": 11078, + "PH": 11079, + "ĠAtl": 11080, + "cred": 11081, + "/LICENSE": 11082, + "Ġmes": 11083, + "Ġadvanced": 11084, + ".java": 11085, + ".Sh": 11086, + "Go": 11087, + "kill": 11088, + "fp": 11089, + "_settings": 11090, + "Ġpal": 11091, + "Ġtruck": 11092, + "Ġcombined": 11093, + "Ġ\"${": 11094, + "ĠCorpor": 11095, + "Ġjoined": 11096, + "ĠJose": 11097, + "ĠCup": 11098, + "uns": 11099, + "estival": 11100, + "levision": 11101, + "Ġbroken": 11102, + "Ġmarriage": 11103, + "ĠWestern": 11104, + "Ġrepresents": 11105, + "ĠTitle": 11106, + "Ġss": 11107, + ".Ass": 11108, + "ongoose": 11109, + "iento": 11110, + "<>();Ċ": 11111, + "Ġabsolutely": 11112, + "Ġsmooth": 11113, + "TERN": 11114, + "ĠUnless": 11115, + "Word": 11116, + "Ġmerge": 11117, + "igan": 11118, + "ĠVol": 11119, + "Ġnn": 11120, + ".getId": 11121, + "Ġз": 11122, + "171": 11123, + "Ġsexy": 11124, + "Ġseeking": 11125, + "Single": 11126, + ".this": 11127, + "179": 11128, + "Ġkom": 11129, + "bound": 11130, + ";\"": 11131, + "ĠfontSize": 11132, + "_df": 11133, + "Ġinjury": 11134, + "(H": 11135, + "Ġissued": 11136, + "_END": 11137, + ":self": 11138, + "020": 11139, + "Ġpatch": 11140, + "Ġleaves": 11141, + "Ġadopt": 11142, + "FileName": 11143, + "ãĢIJ": 11144, + "Ġexecutive": 11145, + "ĠByte": 11146, + "]))Ċ": 11147, + "Ġnu": 11148, + "outing": 11149, + "cluding": 11150, + "-R": 11151, + ".options": 11152, + "Ġsubstant": 11153, + "avax": 11154, + "ĠBUT": 11155, + "Ġtechnical": 11156, + "Ġtwice": 11157, + "Ġmás": 11158, + "Ġunivers": 11159, + "yr": 11160, + "Ġdrag": 11161, + "ĠDC": 11162, + "Ġsed": 11163, + "Ġbot": 11164, + "ĠPal": 11165, + "ĠHall": 11166, + "forcement": 11167, + "Ġauch": 11168, + ".mod": 11169, + "notation": 11170, + "_files": 11171, + ".line": 11172, + 
"_flag": 11173, + "[name": 11174, + "Ġresolution": 11175, + "Ġbott": 11176, + "(\"[": 11177, + "ende": 11178, + "(arr": 11179, + "Free": 11180, + "(@\"": 11181, + "ĠDistrict": 11182, + "PEC": 11183, + ":-": 11184, + "Picker": 11185, + "ĠJo": 11186, + "ĠĠĠĠĠĊ": 11187, + "ĠRiver": 11188, + "_rows": 11189, + "Ġhelpful": 11190, + "Ġmassive": 11191, + "---Ċ": 11192, + "Ġmeasures": 11193, + "007": 11194, + "ĠRuntime": 11195, + "Ġworry": 11196, + "ĠSpec": 11197, + "ĉD": 11198, + "ãĢij": 11199, + "Ġ){Ċ": 11200, + "Ġworse": 11201, + "(filename": 11202, + "Ġlay": 11203, + "Ġmagic": 11204, + "ĠTheir": 11205, + "oul": 11206, + "stroy": 11207, + "ĠWhere": 11208, + "280": 11209, + "Ġsudden": 11210, + "Ġdefe": 11211, + "Ġbinding": 11212, + "Ġflight": 11213, + "ĠOnInit": 11214, + "ĠWomen": 11215, + "ĠPolicy": 11216, + "Ġdrugs": 11217, + "ishing": 11218, + "('../": 11219, + "ĠMel": 11220, + "peat": 11221, + "tor": 11222, + "Ġproposed": 11223, + "Ġstated": 11224, + "_RES": 11225, + "Ġeast": 11226, + "212": 11227, + "ĠCONDITION": 11228, + "_desc": 11229, + "Ġwinning": 11230, + "folio": 11231, + "Mapper": 11232, + "ĠPan": 11233, + "ĠAnge": 11234, + ".servlet": 11235, + "Ġcopies": 11236, + "LM": 11237, + "Ġvm": 11238, + "åį": 11239, + "Ġdictionary": 11240, + "Seg": 11241, + "177": 11242, + "elines": 11243, + "ĠSend": 11244, + "Ġiron": 11245, + "ĠFort": 11246, + "166": 11247, + ".domain": 11248, + "Ġdebate": 11249, + "NotNull": 11250, + "eq": 11251, + "acher": 11252, + "lf": 11253, + "ĉfmt": 11254, + "Ġlawy": 11255, + "178": 11256, + "ÄŁ": 11257, + "ĠMen": 11258, + "Ġtrim": 11259, + "(NULL": 11260, + "Ġ!!": 11261, + "Ġpad": 11262, + "Ġfollows": 11263, + "\"][\"": 11264, + "requ": 11265, + "ĠEp": 11266, + ".github": 11267, + "(img": 11268, + "eto": 11269, + "('\\": 11270, + "Services": 11271, + "umbnail": 11272, + "_main": 11273, + "pleted": 11274, + "fortunately": 11275, + "Ġwindows": 11276, + "Ġplane": 11277, + "ĠConnection": 11278, + ".local": 11279, + "uard": 11280, + "}\\": 11281, + 
"==\"": 11282, + "andon": 11283, + "ĠRoy": 11284, + "west": 11285, + "158": 11286, + "iginal": 11287, + "emies": 11288, + "itz": 11289, + "'):Ċ": 11290, + "ĠPeter": 11291, + "Ġtough": 11292, + "Ġreduced": 11293, + "Ġcalculate": 11294, + "Ġrapid": 11295, + "customer": 11296, + "Ġefficient": 11297, + "Ġmedium": 11298, + "Ġfell": 11299, + ".ref": 11300, + "ĠCas": 11301, + "Ġfeedback": 11302, + "Speed": 11303, + "(output": 11304, + "aje": 11305, + "Ġcategories": 11306, + "Ġfee": 11307, + "};": 11308, + "Ġdeleted": 11309, + "reh": 11310, + "Ġproof": 11311, + "Desc": 11312, + "Build": 11313, + "Ġsides": 11314, + ".ArrayList": 11315, + "-%": 11316, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 11317, + "ر": 11318, + ".match": 11319, + "ли": 11320, + "Ġfeels": 11321, + "Ġachieve": 11322, + "Ġclim": 11323, + "_ON": 11324, + "ĠCD": 11325, + "Ġteacher": 11326, + "_current": 11327, + "bn": 11328, + "_PL": 11329, + "isting": 11330, + "Enable": 11331, + "GEN": 11332, + "Ġtv": 11333, + "Ġsock": 11334, + "Ġplays": 11335, + "Ġdiscount": 11336, + "ĠKE": 11337, + "ĠDebug": 11338, + "Fore": 11339, + "ĠIraq": 11340, + "Ġappearance": 11341, + "Mon": 11342, + "Ġstyled": 11343, + "ĠHuman": 11344, + "iot": 11345, + "ĠHistory": 11346, + "Ġsac": 11347, + "ĠCollection": 11348, + "Ġrecommended": 11349, + ".Selected": 11350, + "Ġorganizations": 11351, + "Ġdiscovered": 11352, + "cohol": 11353, + "adas": 11354, + "ĠThomas": 11355, + "May": 11356, + "Ġconserv": 11357, + "Ġdomin": 11358, + "ĠFollow": 11359, + "ĠSection": 11360, + "ĠThanks": 11361, + "Username": 11362, + "Ġrecipe": 11363, + "Ġwonderful": 11364, + ".sleep": 11365, + "_if": 11366, + "ĉĊĉĊ": 11367, + "orno": 11368, + "Ġru": 11369, + "_target": 11370, + ".\"\"": 11371, + "à¦": 11372, + "EventArgs": 11373, + "Ġinputs": 11374, + "Ġfif": 11375, + "Ġvision": 11376, + "cy": 11377, + "ĠSeries": 11378, + ")(((": 11379, + "Ġtrading": 11380, + "Ġmarker": 11381, + "Begin": 11382, + "Ġtypically": 11383, + "Ġcauses": 11384, + "dropdown": 11385, + 
"_DEBUG": 11386, + "260": 11387, + "Ġdetect": 11388, + "country": 11389, + "!\");Ċ": 11390, + "ĉR": 11391, + "appy": 11392, + "Ġcref": 11393, + "('<": 11394, + "\"=>": 11395, + "ĠLE": 11396, + "reader": 11397, + "Ġadministr": 11398, + "õ": 11399, + "ucket": 11400, + "Ġfashion": 11401, + ".char": 11402, + "izar": 11403, + "Ġdisable": 11404, + "Ġsuc": 11405, + "ĠLive": 11406, + "issue": 11407, + "Ġmetadata": 11408, + "flags": 11409, + "ĠðŁ": 11410, + "Ġcommitted": 11411, + "Ġva": 11412, + "Ġrough": 11413, + "Ġ'''Ċ": 11414, + "Ġhighlight": 11415, + "_vars": 11416, + "VO": 11417, + "Ġencoding": 11418, + "-Z": 11419, + "_sign": 11420, + "$(\"#": 11421, + "Ġrain": 11422, + "reatest": 11423, + "ĠEND": 11424, + "Selection": 11425, + "Ġcandidates": 11426, + "Ġsav": 11427, + ".Empty": 11428, + "Ġdecisions": 11429, + "Ġcollabor": 11430, + "ridge": 11431, + "feed": 11432, + "ression": 11433, + "Ġpersons": 11434, + "VM": 11435, + "008": 11436, + "ega": 11437, + "_BIT": 11438, + "According": 11439, + "acked": 11440, + "Ġdollars": 11441, + "_loss": 11442, + "ĠCost": 11443, + "}\"Ċ": 11444, + "Notification": 11445, + "Ġprostit": 11446, + "Ġauthority": 11447, + ".rec": 11448, + "Ġspokes": 11449, + "ĠToday": 11450, + "istant": 11451, + "ĠHead": 11452, + "âĢĿ.": 11453, + "ertainment": 11454, + "cean": 11455, + "culate": 11456, + "Ġven": 11457, + "However": 11458, + "_arr": 11459, + "Ġtokens": 11460, + "Graph": 11461, + "ĠJud": 11462, + "ĠVirgin": 11463, + "ĠSerial": 11464, + "unning": 11465, + "Mutable": 11466, + "agers": 11467, + ".csv": 11468, + "Ġdeveloping": 11469, + "Ġinstructions": 11470, + "Ġpromise": 11471, + "Ġrequested": 11472, + "_encode": 11473, + "/\"": 11474, + "ĠIcon": 11475, + "uilt": 11476, + "-day": 11477, + "Ġintelligence": 11478, + ".IS": 11479, + "ĠObservable": 11480, + "ĠHard": 11481, + "Bool": 11482, + "211": 11483, + "idential": 11484, + ".Anchor": 11485, + "Ġselling": 11486, + "CI": 11487, + "AGES": 11488, + "tle": 11489, + "bur": 11490, + "UFFER": 11491, + 
"RY": 11492, + "Ġbigger": 11493, + "Ġrat": 11494, + "Ġfamous": 11495, + "Ġtypename": 11496, + "Ġexplained": 11497, + "}}Ċ": 11498, + "Ġnuclear": 11499, + "-N": 11500, + "Ġcrisis": 11501, + "ĠEnter": 11502, + "Ġanswers": 11503, + "/${": 11504, + "/pl": 11505, + "Ġsequ": 11506, + "_next": 11507, + "mask": 11508, + "Ġstanding": 11509, + "Ġplenty": 11510, + "ĠCross": 11511, + "ĉret": 11512, + "dro": 11513, + "ĠCast": 11514, + "167": 11515, + "=true": 11516, + "ĠChris": 11517, + "icio": 11518, + "ĠMike": 11519, + "Decimal": 11520, + "addComponent": 11521, + "Len": 11522, + "Ġcock": 11523, + "Ġ#{": 11524, + "URN": 11525, + "": 11657, + "Ġ*=": 11658, + "ĠPS": 11659, + "Ġdangerous": 11660, + "[p": 11661, + "OME": 11662, + "Other": 11663, + "ĠStringBuilder": 11664, + "Points": 11665, + "heading": 11666, + "Ġcurrency": 11667, + "Ġpercentage": 11668, + "_API": 11669, + "Ġclassic": 11670, + "thead": 11671, + "ĠMO": 11672, + "FE": 11673, + "Idx": 11674, + "await": 11675, + "Ġè": 11676, + "Ġaccident": 11677, + "Ġvariant": 11678, + "Ġmyst": 11679, + "ĠLand": 11680, + "ĠBre": 11681, + "Ġharm": 11682, + "ĠAcc": 11683, + "Ġcharged": 11684, + "iones": 11685, + "Visibility": 11686, + "arry": 11687, + "ĠLanguage": 11688, + "Ġwalking": 11689, + "\".ĊĊ": 11690, + "ifer": 11691, + "Ġleadership": 11692, + ".From": 11693, + "ynam": 11694, + "Ġtimestamp": 11695, + "ipt": 11696, + "ĠHas": 11697, + "REFER": 11698, + "ĠIts": 11699, + "Ġlistener": 11700, + "UTE": 11701, + "213": 11702, + "_description": 11703, + "Ġexperiences": 11704, + "Ġcreates": 11705, + "RS": 11706, + "cart": 11707, + "black": 11708, + "Ġchoices": 11709, + "war": 11710, + "750": 11711, + "Ġ'''": 11712, + "Ġordered": 11713, + "Ġevening": 11714, + "Ġpil": 11715, + "Ġtun": 11716, + "ĠBad": 11717, + "(app": 11718, + "random": 11719, + "Ġexplicit": 11720, + "Ġarrived": 11721, + "Ġfly": 11722, + "Ġeconom": 11723, + "-mail": 11724, + "Ġlists": 11725, + "Ġarchitect": 11726, + "234": 11727, + "ĠPay": 11728, + "Ġds": 11729, + "ĠSol": 
11730, + "Ġvehicles": 11731, + "Hz": 11732, + "-com": 11733, + "Ġking": 11734, + "_equal": 11735, + "ĠHelp": 11736, + "Ġabuse": 11737, + "480": 11738, + "169": 11739, + "--;Ċ": 11740, + "Ġextr": 11741, + "Ġchemical": 11742, + "ä¿": 11743, + "Ġorient": 11744, + "Ġbreath": 11745, + "ĠSpace": 11746, + "(element": 11747, + "wait": 11748, + "DED": 11749, + "igma": 11750, + "Ġentr": 11751, + "Ġsob": 11752, + "-name": 11753, + "Ġaffected": 11754, + "ika": 11755, + "Ġcoal": 11756, + "_work": 11757, + "Ġhundreds": 11758, + "Ġpolitics": 11759, + "subject": 11760, + "Ġconsumer": 11761, + "ANGE": 11762, + "Ġrepeated": 11763, + "Send": 11764, + "Ġ#[": 11765, + "Ġprotocol": 11766, + "Ġleads": 11767, + "useum": 11768, + "Every": 11769, + "808": 11770, + "174": 11771, + "Import": 11772, + "(count": 11773, + "Ġchallenges": 11774, + "Ġnovel": 11775, + "Ġdepart": 11776, + "bits": 11777, + ".Current": 11778, + "Ġ`${": 11779, + "oting": 11780, + "(\\": 11781, + "Ġcreative": 11782, + "Ġbuff": 11783, + "Ġintroduced": 11784, + "usic": 11785, + "modules": 11786, + "Are": 11787, + "-doc": 11788, + "language": 11789, + "_cache": 11790, + "Ġtod": 11791, + "?>": 11792, + "omething": 11793, + "Ġhun": 11794, + "åº": 11795, + "aters": 11796, + "Intent": 11797, + "Ġimplemented": 11798, + "ĠCase": 11799, + "Children": 11800, + "Ġnotification": 11801, + "Renderer": 11802, + "Wrapper": 11803, + "Objects": 11804, + "tl": 11805, + ".Contains": 11806, + "Plugin": 11807, + ".row": 11808, + "Ġforg": 11809, + "Ġpermit": 11810, + "Ġtargets": 11811, + "ĠIF": 11812, + "Ġtip": 11813, + "sex": 11814, + "Ġsupports": 11815, + "Ġfold": 11816, + "photo": 11817, + "},čĊ": 11818, + "Ġgoogle": 11819, + "$('#": 11820, + "Ġsharing": 11821, + "Ġgoods": 11822, + "vs": 11823, + "ĠDan": 11824, + "Rate": 11825, + "ĠMartin": 11826, + "Ġmanner": 11827, + "lie": 11828, + ".The": 11829, + "Internal": 11830, + "ĠCONTR": 11831, + "Mock": 11832, + "RIGHT": 11833, + "Ġ'{": 11834, + "Ġcontrols": 11835, + "Mat": 11836, + "Ġmand": 
11837, + "Ġextended": 11838, + "Ok": 11839, + "Ġembed": 11840, + "Ġplanet": 11841, + "ĠNon": 11842, + "-ch": 11843, + ")\",": 11844, + "epar": 11845, + "Ġbelieved": 11846, + "ĠEnvironment": 11847, + "ĠFriend": 11848, + "-res": 11849, + "Ġhandling": 11850, + "nic": 11851, + "-level": 11852, + "scri": 11853, + "Xml": 11854, + "BE": 11855, + "ungen": 11856, + "Ġalter": 11857, + "[idx": 11858, + "Pop": 11859, + "cam": 11860, + "Ġ(((": 11861, + "Ġshipping": 11862, + "Ġbattery": 11863, + "iddleware": 11864, + "MC": 11865, + "Ġimpl": 11866, + "otation": 11867, + "ĠLab": 11868, + "