diff --git a/mlc-chat-config.json b/mlc-chat-config.json
new file mode 100644
index 0000000000000000000000000000000000000000..32261992526a15f3aae74cf0af97c78af43af9f7
--- /dev/null
+++ b/mlc-chat-config.json
@@ -0,0 +1,87 @@
+{
+ "version": "0.1.0",
+ "model_type": "llama",
+ "quantization": "q4f32_1",
+ "model_config": {
+ "hidden_size": 8192,
+ "intermediate_size": 28672,
+ "num_attention_heads": 64,
+ "num_hidden_layers": 80,
+ "rms_norm_eps": 1e-05,
+ "vocab_size": 128256,
+ "tie_word_embeddings": false,
+ "position_embedding_base": 500000.0,
+ "rope_scaling": {
+ "factor": 8.0,
+ "high_freq_factor": 4.0,
+ "low_freq_factor": 1.0,
+ "original_max_position_embeddings": 8192,
+ "rope_type": "llama3"
+ },
+ "context_window_size": 131072,
+ "prefill_chunk_size": 8192,
+ "num_key_value_heads": 8,
+ "head_dim": 128,
+ "tensor_parallel_shards": 1,
+ "pipeline_parallel_stages": 1,
+ "max_batch_size": 128,
+ "disaggregation": false
+ },
+ "vocab_size": 128256,
+ "context_window_size": 131072,
+ "sliding_window_size": -1,
+ "prefill_chunk_size": 8192,
+ "attention_sink_size": -1,
+ "tensor_parallel_shards": 1,
+ "pipeline_parallel_stages": 1,
+ "temperature": 1.0,
+ "presence_penalty": 0.0,
+ "frequency_penalty": 0.0,
+ "repetition_penalty": 1.0,
+ "top_p": 1.0,
+ "tokenizer_files": [
+ "tokenizer.json",
+ "tokenizer_config.json"
+ ],
+ "tokenizer_info": {
+ "token_postproc_method": "byte_level",
+ "prepend_space_in_encode": false,
+ "strip_space_in_decode": false
+ },
+ "conv_template": {
+ "name": "deepseek_v3",
+ "system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
+ "system_message": "You are a helpful assistant.",
+ "system_prefix_token_ids": null,
+ "add_role_after_system_message": true,
+ "roles": {
+ "user": "<\uff5cUser\uff5c>",
+ "assistant": "<\uff5cAssistant\uff5c>"
+ },
+ "role_templates": {
+ "user": "{user_message}",
+ "assistant": "{assistant_message}",
+ "tool": "{tool_message}"
+ },
+ "messages": [],
+ "seps": [
+ "",
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
+ ],
+ "role_content_sep": "",
+ "role_empty_sep": "",
+ "stop_str": [],
+ "stop_token_ids": [
+ 151643
+ ],
+ "function_string": "",
+ "use_function_calling": false
+ },
+ "pad_token_id": 0,
+ "bos_token_id": 128000,
+ "eos_token_id": [
+ 128001,
+ 128008,
+ 128009
+ ]
+}
\ No newline at end of file
diff --git a/ndarray-cache-b16.json b/ndarray-cache-b16.json
new file mode 100644
index 0000000000000000000000000000000000000000..c5c3ce71d5fd2866241582f5994d4c6bf5c79c9a
--- /dev/null
+++ b/ndarray-cache-b16.json
@@ -0,0 +1,12575 @@
+{
+ "metadata": {
+ "ParamSize": 805,
+ "ParamBytes": 44100517888.0,
+ "BitsPerParam": 5.000504730733063
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 525336576,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_weight",
+ "shape": [
+ 128256,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 525336576,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3eb26648b5f558c692400dae6a251733"
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 65667072,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_scale",
+ "shape": [
+ 128256,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 65667072,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6614898e29505f2d0e0babc3a8f5a8ad"
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "efdd06442457ffd780ddd35f931a09d4"
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d8850ad695e7afbe4ab9d9c117f849ad"
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fbee9a834a04271177eec1f8ec61fce3"
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "34679a78732edb94cf53ae1791feb1a8"
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "23b299ecfc24900893b39ceaa140ad8b"
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f3e2de86ad9b3da11898710282258c48"
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "55d0aac8c1a5961e4fc3c16d7f2e9096"
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 29392896,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 5242880
+ },
+ {
+ "name": "model.layers.0.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 9437184
+ },
+ {
+ "name": "model.layers.0.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 24117248
+ },
+ {
+ "name": "model.layers.0.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 24133632
+ },
+ {
+ "name": "model.layers.1.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 24150016
+ }
+ ],
+ "md5sum": "00090d155aaa516834e659a64d9c70d3"
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2b62e7c2749ac6970811a8e26a3ba788"
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f12ce6badf344ad78598c1ffd61c69f9"
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "464d55f11ee4c81019703dd9ebb76ad2"
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c4348309d8bf34e3064082ef7a9b02d9"
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8326a3e3650ee0eee56cb611cbb1cc39"
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "267dc9ee7792f6eba8dfd6bc41eba9dd"
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "adeba438497ca117f77e292d2191524b"
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "63932f5deb9b9a4f22e88bb9d1a759b9"
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 28344320,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.1.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 4194304
+ },
+ {
+ "name": "model.layers.1.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 18874368
+ },
+ {
+ "name": "model.layers.1.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 18890752
+ },
+ {
+ "name": "model.layers.2.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 18907136
+ },
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 24150016
+ }
+ ],
+ "md5sum": "08fba2c7c7769ed2924abc240b825f34"
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "afbdabfc265864a6858cb77206425f10"
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "86b98ed8cc26327aa77182790730613d"
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6e416beba5ca69428be3d878dd52258a"
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "629054b59c411ca27f304bde0ca8ec11"
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "eed27800592c2b6f7ace199ba5277e5d"
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.2.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.2.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.3.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "aef1bcf12f8a17012a532a62008ae498"
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e74b7bb95f07d25fee278a1c21250651"
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fba5302eb11121acbd0d212619577572"
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "914346101f63ff7a22c27e7f8c5fcec9"
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5986b1ee36dd2609da5f3a4b26cbab55"
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7f19408534c249089ef6d1b7fc662f2c"
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.3.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.3.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.4.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e991852788848ffb70815d67338aed33"
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f4a2a3f013d2cb2c2ed981628976f0b0"
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ce2f608967b1b6e9e5e196006cd04c4f"
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "be3019ccd048a09d6a567f616c63b275"
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "995cd73c27ccbd925f2b994d6b9c7425"
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6f9ee3dc0c868c97e03204426539e9ec"
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.4.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.4.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.5.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "8e2d217533fb9e5c82164836fa466b6f"
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f49b1801eb1e95ee0bd6d5e7b390e1c1"
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "278fe924ac8163c001173ef539c7b790"
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "35645356d8bd6a6b060d2b9c71423c98"
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6a28490fde27c05d20ff6b923197868a"
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "85a080cd0153c1226cd9480f63cf6444"
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.5.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.5.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.6.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "1e502e5af50c73f26cffa06794804a8c"
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1c12e6371a022cfdf76948e7f5e07a32"
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a26ba7c58090a1d5f212da938297685d"
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c0028141ffb7af45b7b52767d7572342"
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a3c7d689e4e1ce6165cf306ed0e8e6f"
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4b8ef534bc5d03540808c00c50b3694f"
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.6.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.6.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.7.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "8740ca9961626aeac52dedb3aefa8c3f"
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "318f8c4417d7771cf96a6fc4f74db8e7"
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "780e1b9d580672748486bb92723f1d00"
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "79d8a47372051b23ffcc074fcf91ec1b"
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b001d8dd735c18e80f18d029f8a9dfe4"
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "88b11385c9d3f97f8136d748d98af6ee"
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.7.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.7.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.8.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "6b5ea17d47d1241c525ef7d300ccfdce"
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e38a758a29467975b51ea8a471d96120"
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3e588c86fcc28d1447c5c2a8b88822bf"
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f01e793ac96b95b397225fac1e6966e3"
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7ec5780c491a793bef7a298d9b47b097"
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8e8a879b80002d2db5864dca65654bfe"
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.8.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.8.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.9.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e011c4fc71dbe9c4fe180ea51d500393"
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3d736066762d2bc7ddcbd6766b0b4a47"
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d6d150533592a006b57fd48555bf1793"
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a157ca2a7fe7dcc73234acb3f29c815"
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "45eefd20c8ebff790773148a1df27970"
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9df9c9a5c5509de08a813b8c2925f848"
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.9.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.9.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.10.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "5bc22833ebccfdb544225a82585b1a9e"
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ede843d9e31f6611379dc25d0a03b2a5"
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3036941cd629429c0b1b5d8f8fcb6198"
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "261470f35c4ebf6e6ec67b38ea48d97f"
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "259914fec9efdedc15d2f21851c58a87"
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0de3b04c86368247ab7bb63fd8134265"
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.10.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.10.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.11.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "ea0d86fe14ee766d8fdf54bc79890ee6"
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c1fa9ec6e14b644902fac961e6199da6"
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "59856ad446fb398eec944a29fdbce8ee"
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "435ec5f2733708e8c94e0a73e26cf098"
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "900ee62734deb08982ad0c83cdf0703b"
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "179e23f31518b761ebfd29e57e145dd3"
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.11.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.11.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.12.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "dc21b4f0703c8e641421c191df3b87b2"
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ad1e7a7d841152768bba079f7563a9b3"
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8ba48f1bfc5874ad31e4a7c950bcc59d"
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "11ecef06e3163b47fafaf626dad32a32"
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dbddebd2c2708539b0a7c3ad1234bd2f"
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "279584698884b03ad15c20b493cba4e8"
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.12.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.12.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.13.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3b8a367ebebe083efc8a2e17fc4a819a"
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a999c4acefb580d544c449eb51f6588b"
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "42c432c0529e40df61f72182d2bca4fc"
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "012d88f7356ecd458a4dfa3c974ab2a7"
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "af4e465210e4e584b2704f7adca422ad"
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "94fd31634cba092e8dfe3be95620dc0b"
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.13.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.13.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.14.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "db5465ca370160ef1c9094791bed386a"
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2cf581a6b4c0fd1519d107309e3fb5c4"
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "292823c7db6620c7a9e274b3f605ebb4"
+ },
+ {
+ "dataPath": "params_shard_93.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6f5c08b22ca93f45e2012efa861e586b"
+ },
+ {
+ "dataPath": "params_shard_94.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "51cb39911a379d88e1c0de84a2b0b43b"
+ },
+ {
+ "dataPath": "params_shard_95.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9611a3024ce88c69b95e34b241e22a67"
+ },
+ {
+ "dataPath": "params_shard_96.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.14.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.14.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.15.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0eaabf9beb5bbdc9bd46a0d62aa1c443"
+ },
+ {
+ "dataPath": "params_shard_97.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "343784019e030443b34d06730510da34"
+ },
+ {
+ "dataPath": "params_shard_98.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fb11603e3b3ecba3c3164b5cd0f40c04"
+ },
+ {
+ "dataPath": "params_shard_99.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c268018e057189582206c515fd66157f"
+ },
+ {
+ "dataPath": "params_shard_100.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fe6cc2707a9b4de91104c873ee47ebc3"
+ },
+ {
+ "dataPath": "params_shard_101.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d92c13cb2ce5a0bb961b9f32d7f85452"
+ },
+ {
+ "dataPath": "params_shard_102.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.15.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.15.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.16.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "d4e670a27a514c4f074fe6419af4e907"
+ },
+ {
+ "dataPath": "params_shard_103.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8c420ef4da23f5b1bffa0d3544fa1f76"
+ },
+ {
+ "dataPath": "params_shard_104.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a6633e9e16c5576c93b44ef8213a5f8"
+ },
+ {
+ "dataPath": "params_shard_105.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9d62baebfeb51a723b945abb8604d211"
+ },
+ {
+ "dataPath": "params_shard_106.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "48b7f2b7814e22a3543523d955acb68d"
+ },
+ {
+ "dataPath": "params_shard_107.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "68d4697910406651d71b0f3162bb6b98"
+ },
+ {
+ "dataPath": "params_shard_108.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.16.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.16.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.17.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "bd0d3f39b60911f1f78322f415737454"
+ },
+ {
+ "dataPath": "params_shard_109.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1417adb69974e8c6b3802a23ce782627"
+ },
+ {
+ "dataPath": "params_shard_110.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1dd528fdf6e0eae9939eb7fdfd4d1c16"
+ },
+ {
+ "dataPath": "params_shard_111.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "20136b10a5376e92c58a7b42cd37baf1"
+ },
+ {
+ "dataPath": "params_shard_112.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "163fe6673f6262094e028c589fcebf8d"
+ },
+ {
+ "dataPath": "params_shard_113.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "63e3dbe14f2faeb8120e90baae253245"
+ },
+ {
+ "dataPath": "params_shard_114.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.17.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.17.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.18.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "299431a3094815ea7546661af24f19b6"
+ },
+ {
+ "dataPath": "params_shard_115.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "793b305e1045d4d53f9513e1f3e6b940"
+ },
+ {
+ "dataPath": "params_shard_116.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0ad612a786ca67543a7454602d72b5d8"
+ },
+ {
+ "dataPath": "params_shard_117.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5a922fb3c0503eccfd7e100b879acedc"
+ },
+ {
+ "dataPath": "params_shard_118.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8ecd2e5512cc98722f01a0c538876a87"
+ },
+ {
+ "dataPath": "params_shard_119.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "72552d30d13a19426acb7b4732540841"
+ },
+ {
+ "dataPath": "params_shard_120.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.18.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.18.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.19.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "54c92979854fb480f6c99da98f34554d"
+ },
+ {
+ "dataPath": "params_shard_121.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9f3e49492661d523d8b12896c3472a48"
+ },
+ {
+ "dataPath": "params_shard_122.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dc90d74b7fb51dd9de52ae7c2b0403e7"
+ },
+ {
+ "dataPath": "params_shard_123.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0fdade6cb70a87de2dc82edb93c860b4"
+ },
+ {
+ "dataPath": "params_shard_124.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "82d20d0be1c6ec3cbf0ac229e491fc6f"
+ },
+ {
+ "dataPath": "params_shard_125.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9f889371e4ef6bc2f5472ea87e182f66"
+ },
+ {
+ "dataPath": "params_shard_126.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.19.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.19.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.20.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0f4e5929575191b98a434b8ebeb87923"
+ },
+ {
+ "dataPath": "params_shard_127.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "88d2dae990cf124e47c4cbec08922c0f"
+ },
+ {
+ "dataPath": "params_shard_128.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "61a3773fa5103d8d9af46c6ddd771ed2"
+ },
+ {
+ "dataPath": "params_shard_129.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f815a46f52c2cf2d5b10534b692a7084"
+ },
+ {
+ "dataPath": "params_shard_130.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fca70d337a5e874a836cb59b93f6dd07"
+ },
+ {
+ "dataPath": "params_shard_131.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "39008841620c74ca1aef4ac58cb91898"
+ },
+ {
+ "dataPath": "params_shard_132.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.20.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.20.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.21.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "18f1ee4ef2f0edb4d4093ba63343661a"
+ },
+ {
+ "dataPath": "params_shard_133.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dce00e7be553167dbfe25733e7272004"
+ },
+ {
+ "dataPath": "params_shard_134.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a31d79d41f5c0516010708715c1d197"
+ },
+ {
+ "dataPath": "params_shard_135.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3ddca491c7f32720f4e0fde60b01867c"
+ },
+ {
+ "dataPath": "params_shard_136.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0510fb8fc6ba6aa988fff213625bbf2e"
+ },
+ {
+ "dataPath": "params_shard_137.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0c9a1a8cd6f9efa89ff72b785eba6cb3"
+ },
+ {
+ "dataPath": "params_shard_138.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.21.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.21.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.22.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "95a0251da5c59a1488f7bab7c9437c8c"
+ },
+ {
+ "dataPath": "params_shard_139.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "51ecac71550791e32b663c50a712b74c"
+ },
+ {
+ "dataPath": "params_shard_140.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e11e3bbe5504cbb61ed1ef1b45d285a2"
+ },
+ {
+ "dataPath": "params_shard_141.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c42412a1bcf6316a397122710b6aaed9"
+ },
+ {
+ "dataPath": "params_shard_142.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ebff967a51662bfef80207925fdb5fe5"
+ },
+ {
+ "dataPath": "params_shard_143.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "012df5ba5975d1d67e2ea01e35d64b74"
+ },
+ {
+ "dataPath": "params_shard_144.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.22.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.22.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.23.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "df3fd3bce358f5512660b767a2f0d470"
+ },
+ {
+ "dataPath": "params_shard_145.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a004d23951ff9e6f46a096438cbfb525"
+ },
+ {
+ "dataPath": "params_shard_146.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "752af7daac637ac980fdf8a8242402af"
+ },
+ {
+ "dataPath": "params_shard_147.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4608b218b2d2147ce9dae5c2e8c80844"
+ },
+ {
+ "dataPath": "params_shard_148.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3e61e1e3b29b53f76eaadf73ac9b1bed"
+ },
+ {
+ "dataPath": "params_shard_149.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "336b672f32392ad02a2915a0217638ae"
+ },
+ {
+ "dataPath": "params_shard_150.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.23.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.23.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.24.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "eb6438744630c9dba1833260312b6916"
+ },
+ {
+ "dataPath": "params_shard_151.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9e0b6a7ef340b452038b6a068f150282"
+ },
+ {
+ "dataPath": "params_shard_152.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "eabf7be6e36f92b6c1d0b357121b6876"
+ },
+ {
+ "dataPath": "params_shard_153.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "59b910ba6202389ccaacd5a42090f307"
+ },
+ {
+ "dataPath": "params_shard_154.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "50efb68839c84863b00532e8d64b608e"
+ },
+ {
+ "dataPath": "params_shard_155.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "398cd429fd799a93768d33504916081c"
+ },
+ {
+ "dataPath": "params_shard_156.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.24.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.24.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.25.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "efe9e993dccb9d68e06dab611bfc36b0"
+ },
+ {
+ "dataPath": "params_shard_157.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "03bc60d040f94d59f9234d20dee210f0"
+ },
+ {
+ "dataPath": "params_shard_158.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "427634e75a9241cc3f854808b51104c0"
+ },
+ {
+ "dataPath": "params_shard_159.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6d3d6e46e1573a131d052d4a8a809933"
+ },
+ {
+ "dataPath": "params_shard_160.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "86cc6ce7494fdcc87dedc08e61666fd9"
+ },
+ {
+ "dataPath": "params_shard_161.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7acd46d2ec176557e6a923a1f71dba55"
+ },
+ {
+ "dataPath": "params_shard_162.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.25.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.25.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.26.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "1b0ca4a2736271af9deeb85f3785f673"
+ },
+ {
+ "dataPath": "params_shard_163.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e0395aeaecf379d4999b517de047123e"
+ },
+ {
+ "dataPath": "params_shard_164.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2dc39db68b5b2dfefc1679917778fd09"
+ },
+ {
+ "dataPath": "params_shard_165.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "992a5605cc94fbaf37a512cda0b9efcf"
+ },
+ {
+ "dataPath": "params_shard_166.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e98aeeb02e5c206e84969be9c48854b6"
+ },
+ {
+ "dataPath": "params_shard_167.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7d4b4516f376412d32abd1013606fae2"
+ },
+ {
+ "dataPath": "params_shard_168.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.26.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.26.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.27.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "a2807bc5935eb942e1817c8fe1b8322f"
+ },
+ {
+ "dataPath": "params_shard_169.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d819779db0bde9fa3c1a70f55491c61d"
+ },
+ {
+ "dataPath": "params_shard_170.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4d3d8819159487ae524710f6a55ef9d2"
+ },
+ {
+ "dataPath": "params_shard_171.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "618eb3aeb92661136270d8ec97b0cf4f"
+ },
+ {
+ "dataPath": "params_shard_172.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d43fe48134e25129b33918d3a26d5682"
+ },
+ {
+ "dataPath": "params_shard_173.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c309b9e8f3b033cdcd66f6ee8db4473c"
+ },
+ {
+ "dataPath": "params_shard_174.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.27.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.27.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.28.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "94af18c8b8fe4d27e28c9c52ad63c5ca"
+ },
+ {
+ "dataPath": "params_shard_175.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1da157f2f03c353d2a8582b0d03ad768"
+ },
+ {
+ "dataPath": "params_shard_176.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5c4557746e06e32ce52b56d75f0ad06c"
+ },
+ {
+ "dataPath": "params_shard_177.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fff58269ba29baebbc874b9c6c4b5403"
+ },
+ {
+ "dataPath": "params_shard_178.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d6122af64356560bc287c1125185d663"
+ },
+ {
+ "dataPath": "params_shard_179.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "37a369325d9983fa3ed0d16de0c0c558"
+ },
+ {
+ "dataPath": "params_shard_180.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.28.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.28.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.29.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "2c0425710d04da33f8b835837eae4f20"
+ },
+ {
+ "dataPath": "params_shard_181.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e458229df6e5ecdb10f5f2383ee8f4e2"
+ },
+ {
+ "dataPath": "params_shard_182.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7e9041ba5738626f2363819d66f5fdcf"
+ },
+ {
+ "dataPath": "params_shard_183.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ca86004b746ebb1f10566cfc6a704212"
+ },
+ {
+ "dataPath": "params_shard_184.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3f8d5aa4098028454ed8f9f2b930bfee"
+ },
+ {
+ "dataPath": "params_shard_185.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e2a75e74802eab2a18541c1abf68e99b"
+ },
+ {
+ "dataPath": "params_shard_186.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.29.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.29.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.30.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "9f9a3353e559a79896d1ee4e624fcf60"
+ },
+ {
+ "dataPath": "params_shard_187.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7f0da08dbff64b51d6a83a42d6d6283f"
+ },
+ {
+ "dataPath": "params_shard_188.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5ece3079612afeac7e4f0c3f3cb6494b"
+ },
+ {
+ "dataPath": "params_shard_189.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e33a1365da838d45459f80f103e9fc37"
+ },
+ {
+ "dataPath": "params_shard_190.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6552ce348c8a047340e42eb3231ecd73"
+ },
+ {
+ "dataPath": "params_shard_191.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4d326a209b36ecaac84a9555afec375b"
+ },
+ {
+ "dataPath": "params_shard_192.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.30.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.30.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.31.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3e278836a2028f736eca4befe008e448"
+ },
+ {
+ "dataPath": "params_shard_193.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "23d4cfe104b485aeda3174d1cea8c6cc"
+ },
+ {
+ "dataPath": "params_shard_194.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f914c1e208e39d6e642a57c1ab2afd10"
+ },
+ {
+ "dataPath": "params_shard_195.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "860b61044b798014c357ff6f10d9beb3"
+ },
+ {
+ "dataPath": "params_shard_196.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "06fe33bae3deb07dfaeff1634ead9d06"
+ },
+ {
+ "dataPath": "params_shard_197.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "57a2edaf53dd318c2dd12130c8f188ae"
+ },
+ {
+ "dataPath": "params_shard_198.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.31.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.31.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.32.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "f475fcad33025680e317391b2e2b2c6c"
+ },
+ {
+ "dataPath": "params_shard_199.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ae993c62edff8bf94208677c0d49a922"
+ },
+ {
+ "dataPath": "params_shard_200.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a3c358b2fe0cac2c3b5a6f9cc5ab5ff0"
+ },
+ {
+ "dataPath": "params_shard_201.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3929388efbdda78ae51cb20caba9e8f4"
+ },
+ {
+ "dataPath": "params_shard_202.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "aa67735df41736918e8f5feb78f795d3"
+ },
+ {
+ "dataPath": "params_shard_203.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cf1265578a5f4cda15619d20aa083162"
+ },
+ {
+ "dataPath": "params_shard_204.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.32.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.32.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.33.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "cb0a72057d3ad00f41f88f60717674ff"
+ },
+ {
+ "dataPath": "params_shard_205.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1c11f4d93900befbc0ee0e1521f525a6"
+ },
+ {
+ "dataPath": "params_shard_206.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "62523fc73cdb0b835ed06b69541622bf"
+ },
+ {
+ "dataPath": "params_shard_207.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "126dae4364f9217715e68722ecd0c348"
+ },
+ {
+ "dataPath": "params_shard_208.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "278a6d3012d2ffe18d6ff3de86aae1ee"
+ },
+ {
+ "dataPath": "params_shard_209.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "96a7f432c31c04dbf1a18ecd9227fc7b"
+ },
+ {
+ "dataPath": "params_shard_210.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.33.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.33.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.34.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "512877b6be9a639179cb63c69f06a1cd"
+ },
+ {
+ "dataPath": "params_shard_211.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bc43df6ca930bf4275f1c70aa4802e07"
+ },
+ {
+ "dataPath": "params_shard_212.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cefa27e004118023dc49e2ef4ae9b669"
+ },
+ {
+ "dataPath": "params_shard_213.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3f76e710be6bf2972494cd7d022d6e12"
+ },
+ {
+ "dataPath": "params_shard_214.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b139a50aad55fc83f6394eeeb29c6f52"
+ },
+ {
+ "dataPath": "params_shard_215.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e29ff26cf3a9bcc5da4844e46db7536f"
+ },
+ {
+ "dataPath": "params_shard_216.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.34.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.34.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.35.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "a8b3748269d3f95c1d1370e8a8ebdd50"
+ },
+ {
+ "dataPath": "params_shard_217.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bed782fd09e45c347ad559e8e5072ffa"
+ },
+ {
+ "dataPath": "params_shard_218.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0cfb21936fd9b599c845b13bd075d9ea"
+ },
+ {
+ "dataPath": "params_shard_219.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2725974f1510c1d403354c7c179cc4d1"
+ },
+ {
+ "dataPath": "params_shard_220.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8becd3bddf39d86a2c6620f4ab7ac2f3"
+ },
+ {
+ "dataPath": "params_shard_221.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b1cb0cbadbb441b3f480f943bafda8e2"
+ },
+ {
+ "dataPath": "params_shard_222.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.35.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.35.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.36.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c0bec3ec5fb95c5a1e474c7e664b8f33"
+ },
+ {
+ "dataPath": "params_shard_223.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "62bd8722614fcb6a85e8acf22c7aabed"
+ },
+ {
+ "dataPath": "params_shard_224.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c748c30de74131e6f2b06724bcc4ce8e"
+ },
+ {
+ "dataPath": "params_shard_225.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "819a332430157c13e368c8c4a1285c9f"
+ },
+ {
+ "dataPath": "params_shard_226.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "13e27af78e462080f98a7c6772b77b50"
+ },
+ {
+ "dataPath": "params_shard_227.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9040556dbb3661c7ba114df8368414cd"
+ },
+ {
+ "dataPath": "params_shard_228.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.36.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.36.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.37.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "725b7c787d7a55cc13d88444c6778899"
+ },
+ {
+ "dataPath": "params_shard_229.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "61ac7247c58c2aac5e656029d855a07a"
+ },
+ {
+ "dataPath": "params_shard_230.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e1a9725b87546d033d43533ffa38f804"
+ },
+ {
+ "dataPath": "params_shard_231.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "284d97aa60d5afc1dfd06139a2b28f01"
+ },
+ {
+ "dataPath": "params_shard_232.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "17f81c61ca1da9e1df7db1b736ee82c7"
+ },
+ {
+ "dataPath": "params_shard_233.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "79388d186722bf3a3ec58b1056da0b2b"
+ },
+ {
+ "dataPath": "params_shard_234.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.37.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.37.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.38.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "37c6c9f538b80b2baa78a7a3896bdcd4"
+ },
+ {
+ "dataPath": "params_shard_235.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e7a9e544367ca01a82bbe95427961fd0"
+ },
+ {
+ "dataPath": "params_shard_236.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9e6e53aeb67809933ea41048aad080be"
+ },
+ {
+ "dataPath": "params_shard_237.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5af9f3f393c4bd1c8f37631e2c488d32"
+ },
+ {
+ "dataPath": "params_shard_238.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a38d3c2f0192991b9b38506bd7f3f106"
+ },
+ {
+ "dataPath": "params_shard_239.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4eceb0073e3057b069134f9eff7945df"
+ },
+ {
+ "dataPath": "params_shard_240.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.38.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.38.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.39.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e68d3c7895452981dd0518a9b44ea776"
+ },
+ {
+ "dataPath": "params_shard_241.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ea6d86343e1855258dc182a800a4d2b5"
+ },
+ {
+ "dataPath": "params_shard_242.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0aa61fbea8a0e31e416deef0c16773b8"
+ },
+ {
+ "dataPath": "params_shard_243.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d778a8241c6a321827742aee3f35b12c"
+ },
+ {
+ "dataPath": "params_shard_244.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "15e031314915146ad0e5c014b3de5987"
+ },
+ {
+ "dataPath": "params_shard_245.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e4045c6c5758dadce200c66ad7caedf9"
+ },
+ {
+ "dataPath": "params_shard_246.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.39.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.39.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.40.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "7278f0271d5dd479d62f1c3439eca83f"
+ },
+ {
+ "dataPath": "params_shard_247.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7dc217df3c8cc97a3744962d5acee566"
+ },
+ {
+ "dataPath": "params_shard_248.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f6f0e9975de5fa8c46628ade3b5484da"
+ },
+ {
+ "dataPath": "params_shard_249.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c03306a51bfa6fe745b7d5d2f9732a97"
+ },
+ {
+ "dataPath": "params_shard_250.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "822fed4f6b5538648ad0042d2841a23d"
+ },
+ {
+ "dataPath": "params_shard_251.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e9fd0ec34ac9759a07281a2b1d8f25c7"
+ },
+ {
+ "dataPath": "params_shard_252.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.40.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.40.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.41.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "b3fda6a1b99f53cb4ba29d9c514016e6"
+ },
+ {
+ "dataPath": "params_shard_253.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2a7c46de7f9fd9bf79d08ccb8b53adc5"
+ },
+ {
+ "dataPath": "params_shard_254.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2a835ca06c0839e8d6f5a96ed2bebfca"
+ },
+ {
+ "dataPath": "params_shard_255.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "131d7d71345e3a0078520a1c463600b4"
+ },
+ {
+ "dataPath": "params_shard_256.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a5a4a4eaab2c04e8c56024e99f4ec365"
+ },
+ {
+ "dataPath": "params_shard_257.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b2451b322968cb0820b4c857937f39ee"
+ },
+ {
+ "dataPath": "params_shard_258.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.41.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.41.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.42.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "af6878f0a029845d141bd54d41813582"
+ },
+ {
+ "dataPath": "params_shard_259.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "374625e7f063378799667dd3d28791cc"
+ },
+ {
+ "dataPath": "params_shard_260.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ae3e41a16e5cf31b113e35a2fdcb17cb"
+ },
+ {
+ "dataPath": "params_shard_261.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e28fd4dc34f1e77922e7711cb84bdb0d"
+ },
+ {
+ "dataPath": "params_shard_262.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "24d43470b2a61851f1d0aa724f65ba5b"
+ },
+ {
+ "dataPath": "params_shard_263.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2b6758a378cc7c6a71d980813d50ac56"
+ },
+ {
+ "dataPath": "params_shard_264.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.42.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.42.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.43.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "4ca2411153668532408d64b41f844e36"
+ },
+ {
+ "dataPath": "params_shard_265.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2611f4a9cb926c71ada5888092ca0034"
+ },
+ {
+ "dataPath": "params_shard_266.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d3a98a8e146848847f848164aa9d0312"
+ },
+ {
+ "dataPath": "params_shard_267.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ca9ada01e9a0540a3abc940199e16f53"
+ },
+ {
+ "dataPath": "params_shard_268.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ae823724cf8520b16cadc221c5ea97d9"
+ },
+ {
+ "dataPath": "params_shard_269.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cd901a127dc79e2ed2a764715fbb018a"
+ },
+ {
+ "dataPath": "params_shard_270.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.43.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.43.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.44.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "d30ad2527e11a540d5ee02e044f28420"
+ },
+ {
+ "dataPath": "params_shard_271.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b19ebcd6bda0f55e1d4f0b376f91767a"
+ },
+ {
+ "dataPath": "params_shard_272.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dfa8692ad9cd6ddb99cf4e1d496d2c69"
+ },
+ {
+ "dataPath": "params_shard_273.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "46fd1fcaf5489e7e2a10c78a6be74838"
+ },
+ {
+ "dataPath": "params_shard_274.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "adbe51be2b94e9629894b5804e0e9407"
+ },
+ {
+ "dataPath": "params_shard_275.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e57fb8307e7cf8fe2d8b831f8cf4975e"
+ },
+ {
+ "dataPath": "params_shard_276.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.44.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.44.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.45.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "05c499c5b9d362c3b877635ca39cfc21"
+ },
+ {
+ "dataPath": "params_shard_277.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b6e5f4be3e833a985468ca67e993a1e5"
+ },
+ {
+ "dataPath": "params_shard_278.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f8fcffc0ba2a11858a2b2ebc79360761"
+ },
+ {
+ "dataPath": "params_shard_279.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fe795e1ffe879aa8e87c2528531c60d8"
+ },
+ {
+ "dataPath": "params_shard_280.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a20e3cc24bb52d6f5b3bd9b99fb1f7b9"
+ },
+ {
+ "dataPath": "params_shard_281.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f2ac52a6590269469fd50fcf884cd508"
+ },
+ {
+ "dataPath": "params_shard_282.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.45.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.45.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.46.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "5ac56d3c461228107ebee3911676919d"
+ },
+ {
+ "dataPath": "params_shard_283.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "663c3f34e89b5b517bb381fbfe7557ac"
+ },
+ {
+ "dataPath": "params_shard_284.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d4982bd9762ec3aa8d6fa40208c143dc"
+ },
+ {
+ "dataPath": "params_shard_285.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d5c0b8f0e14b6d20379753bbeb29ea36"
+ },
+ {
+ "dataPath": "params_shard_286.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a29cbee9a62d505d7a6ae1e9593e7ed1"
+ },
+ {
+ "dataPath": "params_shard_287.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ac4b080929fc92ec0e9a6d2066712e61"
+ },
+ {
+ "dataPath": "params_shard_288.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.46.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.46.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.47.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "438f04bd27d7883939b2822cd82fc9f4"
+ },
+ {
+ "dataPath": "params_shard_289.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.48.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9597f604ee79e59e3233da7d887cc667"
+ },
+ {
+ "dataPath": "params_shard_290.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.48.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "25c626e13186bfb968a027b8ad75669f"
+ },
+ {
+ "dataPath": "params_shard_291.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9aa82634e22ce3364646ff4ee282843c"
+ },
+ {
+ "dataPath": "params_shard_292.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "16c081950fb0a203c7fe517221bac632"
+ },
+ {
+ "dataPath": "params_shard_293.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b75130a9426cc5878ca7adc37feb5d06"
+ },
+ {
+ "dataPath": "params_shard_294.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.47.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.47.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.48.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.48.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "67183418d9b0584f5709593da8b4067f"
+ },
+ {
+ "dataPath": "params_shard_295.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.49.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9889d460341c02d901966596bf262cdc"
+ },
+ {
+ "dataPath": "params_shard_296.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.49.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7c22439b8a2ff2cbbc205a820e68988e"
+ },
+ {
+ "dataPath": "params_shard_297.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "24bd92886bf03a9360245a7b415f8013"
+ },
+ {
+ "dataPath": "params_shard_298.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "07cc9229afe6edc077bdb3a397051d0d"
+ },
+ {
+ "dataPath": "params_shard_299.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4764653c765376f01e1f11148f024c00"
+ },
+ {
+ "dataPath": "params_shard_300.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.48.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.48.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.49.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.49.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3a047aeb9c0455902eef0084424d05ef"
+ },
+ {
+ "dataPath": "params_shard_301.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.50.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e35827193c0dd5e8bba0c6d37d179b06"
+ },
+ {
+ "dataPath": "params_shard_302.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.50.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "37bdea87bd37d94a0af44cba9d6916ff"
+ },
+ {
+ "dataPath": "params_shard_303.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f5b3d8d72605fc3ba49ef5e458593a24"
+ },
+ {
+ "dataPath": "params_shard_304.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "87a7707a1f51ab39f09ee8da7701c9df"
+ },
+ {
+ "dataPath": "params_shard_305.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5ab4d4423853cd949d394c0a7dbc5e2e"
+ },
+ {
+ "dataPath": "params_shard_306.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.49.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.49.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.50.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.50.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "5008d6497bda2c5bacc357c4975d84dc"
+ },
+ {
+ "dataPath": "params_shard_307.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.51.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "898769e571cfbbe506662c5af71fd627"
+ },
+ {
+ "dataPath": "params_shard_308.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.51.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "67caa3dfc7f6df3c7bc411429a957034"
+ },
+ {
+ "dataPath": "params_shard_309.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c12ba3baecf6319317e023fc4ea1236d"
+ },
+ {
+ "dataPath": "params_shard_310.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "642c08c68d1456774cddb62d0d1d37bc"
+ },
+ {
+ "dataPath": "params_shard_311.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ce5207136300d3fe4a0ab9f5b523c136"
+ },
+ {
+ "dataPath": "params_shard_312.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.50.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.50.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.51.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.51.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "28e733c6c84e569f87697b2a7a48bfaf"
+ },
+ {
+ "dataPath": "params_shard_313.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.52.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4e5987d3244c48b3aa0d46d1ceee2951"
+ },
+ {
+ "dataPath": "params_shard_314.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.52.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a173c5c565bc1892cfbfd258c1cb6289"
+ },
+ {
+ "dataPath": "params_shard_315.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "25394fc7a51a99827c101012ac3f5f19"
+ },
+ {
+ "dataPath": "params_shard_316.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b6f6ab4f9a40ec72cc039bb6840550bf"
+ },
+ {
+ "dataPath": "params_shard_317.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1bdc90db1498982bf164fb79785c876d"
+ },
+ {
+ "dataPath": "params_shard_318.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.51.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.51.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.52.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.52.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0cc4e820530177a74513adb27afbd9c8"
+ },
+ {
+ "dataPath": "params_shard_319.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.53.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fd96917f49ea5f021c4c33d30bed32b4"
+ },
+ {
+ "dataPath": "params_shard_320.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.53.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "41c50491e9d060338cb630ab2ba88999"
+ },
+ {
+ "dataPath": "params_shard_321.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bab4e1a1288bd5314754b46774495237"
+ },
+ {
+ "dataPath": "params_shard_322.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7c13baaa72e3f7916d895b1ec526977c"
+ },
+ {
+ "dataPath": "params_shard_323.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "19f2d96ab3750265f7f12328aae4b322"
+ },
+ {
+ "dataPath": "params_shard_324.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.52.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.52.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.53.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.53.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "01882d19d9896aa4f0e2f684bed12034"
+ },
+ {
+ "dataPath": "params_shard_325.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.54.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8b466389d5e67a19cfaf0cbe6dd8ba37"
+ },
+ {
+ "dataPath": "params_shard_326.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.54.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6e8acffaf0096d5dfdb61a156a7fd4a1"
+ },
+ {
+ "dataPath": "params_shard_327.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3b953a0e2f17d9d48281e62021524013"
+ },
+ {
+ "dataPath": "params_shard_328.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9a1a10b192e1f02c27370661bce28fb8"
+ },
+ {
+ "dataPath": "params_shard_329.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b2d3f3e3b1e39e0f79967860b7eb6a76"
+ },
+ {
+ "dataPath": "params_shard_330.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.53.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.53.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.54.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.54.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "774dc85439307a856b0fc4c7aeb20f18"
+ },
+ {
+ "dataPath": "params_shard_331.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.55.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e50be005424bc55d474087735ecc75e6"
+ },
+ {
+ "dataPath": "params_shard_332.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.55.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3ccd3056e2ec39fec7e2252ebb7b5201"
+ },
+ {
+ "dataPath": "params_shard_333.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "894f23f697dbc67bff0d490bfe3c6ca8"
+ },
+ {
+ "dataPath": "params_shard_334.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a4794ec700952f23bc76220dd1d76ff4"
+ },
+ {
+ "dataPath": "params_shard_335.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5e2c4c525807a481f26cf25492a2f479"
+ },
+ {
+ "dataPath": "params_shard_336.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.54.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.54.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.55.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.55.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "72d56789d090541ff4e311d0a2136035"
+ },
+ {
+ "dataPath": "params_shard_337.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.56.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a22693c144d25c14ea4c4878c8ef0c06"
+ },
+ {
+ "dataPath": "params_shard_338.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.56.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "63403d019ae94759c582efce72f9cc56"
+ },
+ {
+ "dataPath": "params_shard_339.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b20eb650134daeeca6eb08110c219595"
+ },
+ {
+ "dataPath": "params_shard_340.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8bfc35a9009de9225c3a12cb196e7954"
+ },
+ {
+ "dataPath": "params_shard_341.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a19d8cc746138a7b60884b207ad28ded"
+ },
+ {
+ "dataPath": "params_shard_342.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.55.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.55.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.56.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.56.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0ee1f7a8f52a37163816027cd8631d7f"
+ },
+ {
+ "dataPath": "params_shard_343.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.57.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "507c3daa67d84b90e930c67fa52a15b5"
+ },
+ {
+ "dataPath": "params_shard_344.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.57.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "db67da53b6209bf7ff8448563296d6ef"
+ },
+ {
+ "dataPath": "params_shard_345.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "67e3c67bd2a84887ba16228e28dd0ac1"
+ },
+ {
+ "dataPath": "params_shard_346.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2f6fade64d07f3ca3fbb3d257a49535a"
+ },
+ {
+ "dataPath": "params_shard_347.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "16925bb2bfc6d13779512a252839c5b9"
+ },
+ {
+ "dataPath": "params_shard_348.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.56.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.56.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.57.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.57.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e03fe4d8fb5783798a74f2b88bb22f6e"
+ },
+ {
+ "dataPath": "params_shard_349.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.58.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9294f9b7199e1d8c3917ae043d9f5ff1"
+ },
+ {
+ "dataPath": "params_shard_350.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.58.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9fb78979622f2d2d1d60af9ebf040934"
+ },
+ {
+ "dataPath": "params_shard_351.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5439d9cc96994bb3978b2bedd1661a30"
+ },
+ {
+ "dataPath": "params_shard_352.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a1d1883a4127ea2ca97161a38e77357b"
+ },
+ {
+ "dataPath": "params_shard_353.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c8f52ab478c45d46bfe5c1dbcca973ea"
+ },
+ {
+ "dataPath": "params_shard_354.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.57.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.57.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.58.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.58.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "6bae95a7fbc2f6b207dc1b34143986df"
+ },
+ {
+ "dataPath": "params_shard_355.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.59.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "62c686f0eb51e72b81732e4d0fa48e04"
+ },
+ {
+ "dataPath": "params_shard_356.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.59.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4a29ade65ec4c06248fa509a9dddf7e1"
+ },
+ {
+ "dataPath": "params_shard_357.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "28bed2c7b3b1ecdf4b4d84b6c8093498"
+ },
+ {
+ "dataPath": "params_shard_358.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "26bba2dd3ca1f5993730a127ec469c31"
+ },
+ {
+ "dataPath": "params_shard_359.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "79b165d2163381b9f2946e97c33b877c"
+ },
+ {
+ "dataPath": "params_shard_360.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.58.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.58.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.59.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.59.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c9c3584887279af8aa8975b33630dcbe"
+ },
+ {
+ "dataPath": "params_shard_361.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.60.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a5c35e28fe19aeac8809ca6fbc65812c"
+ },
+ {
+ "dataPath": "params_shard_362.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.60.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "46abccbeaada7f1686efa4d572f2288a"
+ },
+ {
+ "dataPath": "params_shard_363.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2bfaf5563c4b8eb5ce36b2894be64da0"
+ },
+ {
+ "dataPath": "params_shard_364.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7ea0ed2d45a0289cda776e163eb62f60"
+ },
+ {
+ "dataPath": "params_shard_365.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "acb215a9fb8d817566ec255a88741a4a"
+ },
+ {
+ "dataPath": "params_shard_366.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.59.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.59.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.60.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.60.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "24031b013402757a95b725d1d58c624b"
+ },
+ {
+ "dataPath": "params_shard_367.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.61.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "57b888959c536bcb8bf205cc7b50152d"
+ },
+ {
+ "dataPath": "params_shard_368.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.61.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d4be0bfad9a37360e8265ebb8312f851"
+ },
+ {
+ "dataPath": "params_shard_369.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "aa014397cc342d8cda1359d485dbc65e"
+ },
+ {
+ "dataPath": "params_shard_370.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fc9fa177e2d442e80b365be7a2db9a92"
+ },
+ {
+ "dataPath": "params_shard_371.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "acfa98e682d887344f9b823ed57c7eb1"
+ },
+ {
+ "dataPath": "params_shard_372.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.60.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.60.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.61.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.61.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "9ac014c4df99567e2f0d5756e989a56e"
+ },
+ {
+ "dataPath": "params_shard_373.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.62.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3d0caab08ff06305cbc7f314eb1b63c4"
+ },
+ {
+ "dataPath": "params_shard_374.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.62.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "03b557a65f7c6d9989c6979c272f4110"
+ },
+ {
+ "dataPath": "params_shard_375.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5cfee4396006c3232b8e5cbc4195e4ce"
+ },
+ {
+ "dataPath": "params_shard_376.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "01068ac29c21f9bae4d47f07afcbd742"
+ },
+ {
+ "dataPath": "params_shard_377.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "84734260cde97db9b2a28884fb51840c"
+ },
+ {
+ "dataPath": "params_shard_378.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.61.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.61.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.62.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.62.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "4721356a89e76fae03225dc166c64b45"
+ },
+ {
+ "dataPath": "params_shard_379.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.63.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2bd737a0768c57fc61767eedd3da1b24"
+ },
+ {
+ "dataPath": "params_shard_380.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.63.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "775c04cdade416b12a90f76182a0e236"
+ },
+ {
+ "dataPath": "params_shard_381.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "13e2e18669fa832fef5c03d4b7bf7af0"
+ },
+ {
+ "dataPath": "params_shard_382.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ebf12e03b354719fb76bf41855d9cca5"
+ },
+ {
+ "dataPath": "params_shard_383.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4e2c7dfd6c7106cab04e9789c51b7ce0"
+ },
+ {
+ "dataPath": "params_shard_384.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.62.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.62.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.63.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.63.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "898ed8bebc824047cc7b661d3ecefaa9"
+ },
+ {
+ "dataPath": "params_shard_385.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.64.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5f3ecdee3ce4233813abedf394b394e1"
+ },
+ {
+ "dataPath": "params_shard_386.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.64.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9113a6c2931b3e2729e6872f9e273d60"
+ },
+ {
+ "dataPath": "params_shard_387.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6cda3ba42c9dd2b0dfde3c0da425afdc"
+ },
+ {
+ "dataPath": "params_shard_388.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "951e7a961c4b2f401a35777ef037b17b"
+ },
+ {
+ "dataPath": "params_shard_389.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "227f7680ad6a40274c63e35d1a4dba94"
+ },
+ {
+ "dataPath": "params_shard_390.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.63.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.63.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.64.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.64.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "890e02eb523a0696740e51737221a9c9"
+ },
+ {
+ "dataPath": "params_shard_391.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.65.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "89bec5040dddfe37b27f8d40388b075b"
+ },
+ {
+ "dataPath": "params_shard_392.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.65.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "16da05d32abdb1ab271f1b8a3e9487d3"
+ },
+ {
+ "dataPath": "params_shard_393.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6b519f1b4763fc05c1518c9daf5c62e6"
+ },
+ {
+ "dataPath": "params_shard_394.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5c2491aafa5d89eaee143f8986625202"
+ },
+ {
+ "dataPath": "params_shard_395.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f1388f14b8986ed0a660afd2dc29b339"
+ },
+ {
+ "dataPath": "params_shard_396.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.64.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.64.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.65.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.65.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "dd39b8a131088968d99fb6a49a31f3dd"
+ },
+ {
+ "dataPath": "params_shard_397.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.66.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fe1799ce3b4f78bb76b2fc7b012ad469"
+ },
+ {
+ "dataPath": "params_shard_398.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.66.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2961a9e76013f4cc8cdbb438893d7f38"
+ },
+ {
+ "dataPath": "params_shard_399.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3ca2f5aef783f3434a52c1be376c5beb"
+ },
+ {
+ "dataPath": "params_shard_400.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1d2d2a9ff595a15e18a1cb12f0e261c5"
+ },
+ {
+ "dataPath": "params_shard_401.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c6487217b5ca1d13e465239815e7d226"
+ },
+ {
+ "dataPath": "params_shard_402.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.65.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.65.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.66.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.66.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "1ab701cd78af3b96f24c728dae932c19"
+ },
+ {
+ "dataPath": "params_shard_403.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.67.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "64346add10c58ec087a6e2bad28ca61e"
+ },
+ {
+ "dataPath": "params_shard_404.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.67.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4512af4fdcd68d523299ecef9c3eb1ee"
+ },
+ {
+ "dataPath": "params_shard_405.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "63ea311ecab57d56745039d9a5e44b25"
+ },
+ {
+ "dataPath": "params_shard_406.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "52243cbe67bf1680d3c2952996cb67cf"
+ },
+ {
+ "dataPath": "params_shard_407.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d8836abae906061db23356323834aa9f"
+ },
+ {
+ "dataPath": "params_shard_408.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.66.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.66.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.67.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.67.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3493add60010de68c1b0a1db8642f568"
+ },
+ {
+ "dataPath": "params_shard_409.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.68.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d0362e21e91beeed36049e3cf86036d0"
+ },
+ {
+ "dataPath": "params_shard_410.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.68.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d06c6a731f5cb92546bebb797c3e8ee0"
+ },
+ {
+ "dataPath": "params_shard_411.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d3d4f562b872fcf671348de7958ba5e0"
+ },
+ {
+ "dataPath": "params_shard_412.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "392c6246e17701d8d58f3c9519fdf246"
+ },
+ {
+ "dataPath": "params_shard_413.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f7d9917f207a7971d0be89a473d6d8a2"
+ },
+ {
+ "dataPath": "params_shard_414.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.67.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.67.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.68.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.68.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c4f23fb0c836de7034aaf5174e1b3993"
+ },
+ {
+ "dataPath": "params_shard_415.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.69.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1a1ef7b4b4311054fac6ddbfa332470a"
+ },
+ {
+ "dataPath": "params_shard_416.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.69.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b943175c25499b4aa81d59703a90c36c"
+ },
+ {
+ "dataPath": "params_shard_417.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "80d85f785d6f039f694ade4180f5233e"
+ },
+ {
+ "dataPath": "params_shard_418.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "312b0ea77ec14fc0c9a2b3c730fa8a22"
+ },
+ {
+ "dataPath": "params_shard_419.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6d6095a425e03e721d25322d6bbdb313"
+ },
+ {
+ "dataPath": "params_shard_420.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.68.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.68.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.69.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.69.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "5907ba7f58fe04573480c56805cd06a3"
+ },
+ {
+ "dataPath": "params_shard_421.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.70.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e22ff8ce332a0a73082cc7ded803b0a6"
+ },
+ {
+ "dataPath": "params_shard_422.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.70.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "701fa19f952ffea454247cf52683c941"
+ },
+ {
+ "dataPath": "params_shard_423.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d37d1e41eb2c537081ea3da7a56fb83f"
+ },
+ {
+ "dataPath": "params_shard_424.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0a383acfadd7e07f5efbe8339b1ecb78"
+ },
+ {
+ "dataPath": "params_shard_425.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f05866dbb3cd92594a0a4ea098181859"
+ },
+ {
+ "dataPath": "params_shard_426.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.69.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.69.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.70.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.70.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "6cf50e9a91ef7182e0d4f9c14a7aebd0"
+ },
+ {
+ "dataPath": "params_shard_427.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.71.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "04592ca0cfa5ad637d7b707b3806d1f9"
+ },
+ {
+ "dataPath": "params_shard_428.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.71.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "77f73fa70592063a146c366942b6da09"
+ },
+ {
+ "dataPath": "params_shard_429.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "106e2e5288c084fdf24cb38606a3f6ff"
+ },
+ {
+ "dataPath": "params_shard_430.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b5f0bb8c86151fb049b73d0257f49934"
+ },
+ {
+ "dataPath": "params_shard_431.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fe705a93811b97d41e68467724808329"
+ },
+ {
+ "dataPath": "params_shard_432.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.70.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.70.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.71.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.71.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "77aef38e7f0bf3439ab56bfae82b2446"
+ },
+ {
+ "dataPath": "params_shard_433.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.72.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "205573efdcf20a2a6f05971b038aa69a"
+ },
+ {
+ "dataPath": "params_shard_434.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.72.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6340eaa9051ce7af8695f9c70e9ca666"
+ },
+ {
+ "dataPath": "params_shard_435.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0c06b6f430a54095335b4bd3feb9428f"
+ },
+ {
+ "dataPath": "params_shard_436.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f24d07886cc45c582461dafe8f3992e3"
+ },
+ {
+ "dataPath": "params_shard_437.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9787e9629802560c47975b2246026c72"
+ },
+ {
+ "dataPath": "params_shard_438.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.71.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.71.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.72.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.72.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "eff87eb8df2fd9d416ac8fcb82ddc0ac"
+ },
+ {
+ "dataPath": "params_shard_439.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.73.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1c344c707efc2fe7949af5faab0fc97b"
+ },
+ {
+ "dataPath": "params_shard_440.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.73.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f9e6d164781f9f01e1a1fb6eea09727b"
+ },
+ {
+ "dataPath": "params_shard_441.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8d6b5201fcf0b5e4589add90db02c2df"
+ },
+ {
+ "dataPath": "params_shard_442.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "99be8f8ee7317bda642e36efd4b74633"
+ },
+ {
+ "dataPath": "params_shard_443.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0da75744c385e5b76de32f2aea078a2d"
+ },
+ {
+ "dataPath": "params_shard_444.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.72.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.72.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.73.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.73.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "987169a64c7af0b910d9f9c40c08a1cb"
+ },
+ {
+ "dataPath": "params_shard_445.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.74.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "047612ebde13b6d550d4878147e5ae0c"
+ },
+ {
+ "dataPath": "params_shard_446.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.74.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "669694bce70a0a7bcc7f80797884ddbd"
+ },
+ {
+ "dataPath": "params_shard_447.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "87e6936a91fc544a2ebd06246fc21adc"
+ },
+ {
+ "dataPath": "params_shard_448.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d5fd7ab14db07f7450e499daf593d209"
+ },
+ {
+ "dataPath": "params_shard_449.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "79add4990b5f75f0954b9adc81a40bc5"
+ },
+ {
+ "dataPath": "params_shard_450.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.73.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.73.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.74.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.74.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0946db163b8643fc06667225f843a26e"
+ },
+ {
+ "dataPath": "params_shard_451.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.75.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a7ac0342ba94f26e80257cd4aeca0883"
+ },
+ {
+ "dataPath": "params_shard_452.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.75.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "66201ac4a8933ce649713bfceeae54bf"
+ },
+ {
+ "dataPath": "params_shard_453.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b8707b316c631457c70bd6c1b628cc64"
+ },
+ {
+ "dataPath": "params_shard_454.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "64d094fc97af0753742b339583737dc7"
+ },
+ {
+ "dataPath": "params_shard_455.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "09ca1a590ceb8711607a1a0a0dd51832"
+ },
+ {
+ "dataPath": "params_shard_456.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.74.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.74.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.75.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.75.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "adb4defec811675b023e97de7eb7c733"
+ },
+ {
+ "dataPath": "params_shard_457.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.76.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "947913fc58477ab9ffa47a5b89894d65"
+ },
+ {
+ "dataPath": "params_shard_458.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.76.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e2e6f1c52accfcfe9d82f10960dea6b5"
+ },
+ {
+ "dataPath": "params_shard_459.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "590199dca2c197446fbb85bd3ca43baa"
+ },
+ {
+ "dataPath": "params_shard_460.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cbcff28d1dbe1a67149eedbd0014372d"
+ },
+ {
+ "dataPath": "params_shard_461.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a9923af4b76a2e3e65e4861adb27d977"
+ },
+ {
+ "dataPath": "params_shard_462.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.75.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.75.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.76.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.76.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c4ce9d733ba438afc2a724c135593f36"
+ },
+ {
+ "dataPath": "params_shard_463.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.77.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "244fb13d822be6c7d06898a735e60559"
+ },
+ {
+ "dataPath": "params_shard_464.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.77.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a5853e7acdf93790a330f47580bfa51e"
+ },
+ {
+ "dataPath": "params_shard_465.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0d5c22a0a5988d73d09471d89fc163c0"
+ },
+ {
+ "dataPath": "params_shard_466.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "18acd8799ca326ebbe3a2aff29e6e3ff"
+ },
+ {
+ "dataPath": "params_shard_467.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7342c731c9ff15c5adaba8edf7b4be16"
+ },
+ {
+ "dataPath": "params_shard_468.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.76.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.76.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.77.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.77.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "cdd8135716bd2dc5b535341e3eac820c"
+ },
+ {
+ "dataPath": "params_shard_469.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.78.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f8c80f59c4df01148f9c7aa0b4c025c2"
+ },
+ {
+ "dataPath": "params_shard_470.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.78.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "811de3bfa66f2f8b5dd4543560fc9d21"
+ },
+ {
+ "dataPath": "params_shard_471.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "61877e6bbdce8abddaa443d87579ad99"
+ },
+ {
+ "dataPath": "params_shard_472.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6866e9fecdfe546015f91f43a79ab4ce"
+ },
+ {
+ "dataPath": "params_shard_473.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a980cbc566cf413ef9ae6dcfd704e874"
+ },
+ {
+ "dataPath": "params_shard_474.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.77.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.77.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.78.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.78.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "bff4bb2bdb94554add45ff8cdd05d1e6"
+ },
+ {
+ "dataPath": "params_shard_475.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.79.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "531fb937911ccee7083556ee675b6b14"
+ },
+ {
+ "dataPath": "params_shard_476.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.79.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "40962de371c53cf1376f752638a77bd8"
+ },
+ {
+ "dataPath": "params_shard_477.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "935323b86bd8a4818704bb722b125f78"
+ },
+ {
+ "dataPath": "params_shard_478.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "42678600f504d0ef41c6cc1537a33354"
+ },
+ {
+ "dataPath": "params_shard_479.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c115c02ed782ff7ff9a7cfed9d686064"
+ },
+ {
+ "dataPath": "params_shard_480.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.78.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.78.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.79.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.79.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "fff910192a63a35b8b64b2ad87e7fa09"
+ },
+ {
+ "dataPath": "params_shard_481.bin",
+ "format": "raw-shard",
+ "nbytes": 525336576,
+ "records": [
+ {
+ "name": "lm_head.q_weight",
+ "shape": [
+ 128256,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 525336576,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ffb9a4821e85c82ea4b4036509e192c1"
+ },
+ {
+ "dataPath": "params_shard_482.bin",
+ "format": "raw-shard",
+ "nbytes": 65667072,
+ "records": [
+ {
+ "name": "lm_head.q_scale",
+ "shape": [
+ 128256,
+ 256
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 65667072,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "42dcf5cff51f226c09e1243f3df821ad"
+ },
+ {
+ "dataPath": "params_shard_483.bin",
+ "format": "raw-shard",
+ "nbytes": 14729216,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.79.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.79.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.norm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 16384,
+ "byteOffset": 14712832
+ }
+ ],
+ "md5sum": "f266c5ce63191a16a76da09c5e11b48a"
+ }
+ ]
+}
\ No newline at end of file
diff --git a/ndarray-cache.json b/ndarray-cache.json
new file mode 100644
index 0000000000000000000000000000000000000000..04fde1b7b2317fa5cb5a574bcc37a162e6a920ce
--- /dev/null
+++ b/ndarray-cache.json
@@ -0,0 +1,12575 @@
+{
+ "metadata": {
+ "ParamSize": 805,
+ "ParamBytes": 44100517888.0,
+ "BitsPerParam": 5.000504730733063
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 525336576,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_weight",
+ "shape": [
+ 128256,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 525336576,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3eb26648b5f558c692400dae6a251733"
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 65667072,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_scale",
+ "shape": [
+ 128256,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 65667072,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6614898e29505f2d0e0babc3a8f5a8ad"
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "efdd06442457ffd780ddd35f931a09d4"
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d8850ad695e7afbe4ab9d9c117f849ad"
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fbee9a834a04271177eec1f8ec61fce3"
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "34679a78732edb94cf53ae1791feb1a8"
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "23b299ecfc24900893b39ceaa140ad8b"
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f3e2de86ad9b3da11898710282258c48"
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "55d0aac8c1a5961e4fc3c16d7f2e9096"
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 29392896,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 5242880
+ },
+ {
+ "name": "model.layers.0.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 9437184
+ },
+ {
+ "name": "model.layers.0.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 24117248
+ },
+ {
+ "name": "model.layers.0.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 24133632
+ },
+ {
+ "name": "model.layers.1.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 24150016
+ }
+ ],
+ "md5sum": "00090d155aaa516834e659a64d9c70d3"
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2b62e7c2749ac6970811a8e26a3ba788"
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f12ce6badf344ad78598c1ffd61c69f9"
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "464d55f11ee4c81019703dd9ebb76ad2"
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c4348309d8bf34e3064082ef7a9b02d9"
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8326a3e3650ee0eee56cb611cbb1cc39"
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "267dc9ee7792f6eba8dfd6bc41eba9dd"
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "adeba438497ca117f77e292d2191524b"
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "63932f5deb9b9a4f22e88bb9d1a759b9"
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 28344320,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.1.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 4194304
+ },
+ {
+ "name": "model.layers.1.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 18874368
+ },
+ {
+ "name": "model.layers.1.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 18890752
+ },
+ {
+ "name": "model.layers.2.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 18907136
+ },
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 24150016
+ }
+ ],
+ "md5sum": "08fba2c7c7769ed2924abc240b825f34"
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "afbdabfc265864a6858cb77206425f10"
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "86b98ed8cc26327aa77182790730613d"
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6e416beba5ca69428be3d878dd52258a"
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "629054b59c411ca27f304bde0ca8ec11"
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "eed27800592c2b6f7ace199ba5277e5d"
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.2.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.2.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.3.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "aef1bcf12f8a17012a532a62008ae498"
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e74b7bb95f07d25fee278a1c21250651"
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fba5302eb11121acbd0d212619577572"
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "914346101f63ff7a22c27e7f8c5fcec9"
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5986b1ee36dd2609da5f3a4b26cbab55"
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7f19408534c249089ef6d1b7fc662f2c"
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.3.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.3.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.4.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e991852788848ffb70815d67338aed33"
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f4a2a3f013d2cb2c2ed981628976f0b0"
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ce2f608967b1b6e9e5e196006cd04c4f"
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "be3019ccd048a09d6a567f616c63b275"
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "995cd73c27ccbd925f2b994d6b9c7425"
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6f9ee3dc0c868c97e03204426539e9ec"
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.4.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.4.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.5.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "8e2d217533fb9e5c82164836fa466b6f"
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f49b1801eb1e95ee0bd6d5e7b390e1c1"
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "278fe924ac8163c001173ef539c7b790"
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "35645356d8bd6a6b060d2b9c71423c98"
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6a28490fde27c05d20ff6b923197868a"
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "85a080cd0153c1226cd9480f63cf6444"
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.5.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.5.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.6.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "1e502e5af50c73f26cffa06794804a8c"
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1c12e6371a022cfdf76948e7f5e07a32"
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a26ba7c58090a1d5f212da938297685d"
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c0028141ffb7af45b7b52767d7572342"
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a3c7d689e4e1ce6165cf306ed0e8e6f"
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4b8ef534bc5d03540808c00c50b3694f"
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.6.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.6.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.7.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "8740ca9961626aeac52dedb3aefa8c3f"
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "318f8c4417d7771cf96a6fc4f74db8e7"
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "780e1b9d580672748486bb92723f1d00"
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "79d8a47372051b23ffcc074fcf91ec1b"
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b001d8dd735c18e80f18d029f8a9dfe4"
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "88b11385c9d3f97f8136d748d98af6ee"
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.7.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.7.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.8.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "6b5ea17d47d1241c525ef7d300ccfdce"
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e38a758a29467975b51ea8a471d96120"
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3e588c86fcc28d1447c5c2a8b88822bf"
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f01e793ac96b95b397225fac1e6966e3"
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7ec5780c491a793bef7a298d9b47b097"
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8e8a879b80002d2db5864dca65654bfe"
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.8.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.8.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.9.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e011c4fc71dbe9c4fe180ea51d500393"
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3d736066762d2bc7ddcbd6766b0b4a47"
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d6d150533592a006b57fd48555bf1793"
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a157ca2a7fe7dcc73234acb3f29c815"
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "45eefd20c8ebff790773148a1df27970"
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9df9c9a5c5509de08a813b8c2925f848"
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.9.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.9.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.10.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "5bc22833ebccfdb544225a82585b1a9e"
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ede843d9e31f6611379dc25d0a03b2a5"
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3036941cd629429c0b1b5d8f8fcb6198"
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "261470f35c4ebf6e6ec67b38ea48d97f"
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "259914fec9efdedc15d2f21851c58a87"
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0de3b04c86368247ab7bb63fd8134265"
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.10.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.10.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.11.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "ea0d86fe14ee766d8fdf54bc79890ee6"
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c1fa9ec6e14b644902fac961e6199da6"
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "59856ad446fb398eec944a29fdbce8ee"
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "435ec5f2733708e8c94e0a73e26cf098"
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "900ee62734deb08982ad0c83cdf0703b"
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "179e23f31518b761ebfd29e57e145dd3"
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.11.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.11.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.12.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "dc21b4f0703c8e641421c191df3b87b2"
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ad1e7a7d841152768bba079f7563a9b3"
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8ba48f1bfc5874ad31e4a7c950bcc59d"
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "11ecef06e3163b47fafaf626dad32a32"
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dbddebd2c2708539b0a7c3ad1234bd2f"
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "279584698884b03ad15c20b493cba4e8"
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.12.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.12.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.13.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3b8a367ebebe083efc8a2e17fc4a819a"
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a999c4acefb580d544c449eb51f6588b"
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "42c432c0529e40df61f72182d2bca4fc"
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "012d88f7356ecd458a4dfa3c974ab2a7"
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "af4e465210e4e584b2704f7adca422ad"
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "94fd31634cba092e8dfe3be95620dc0b"
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.13.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.13.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.14.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "db5465ca370160ef1c9094791bed386a"
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2cf581a6b4c0fd1519d107309e3fb5c4"
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "292823c7db6620c7a9e274b3f605ebb4"
+ },
+ {
+ "dataPath": "params_shard_93.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6f5c08b22ca93f45e2012efa861e586b"
+ },
+ {
+ "dataPath": "params_shard_94.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "51cb39911a379d88e1c0de84a2b0b43b"
+ },
+ {
+ "dataPath": "params_shard_95.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9611a3024ce88c69b95e34b241e22a67"
+ },
+ {
+ "dataPath": "params_shard_96.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.14.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.14.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.15.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0eaabf9beb5bbdc9bd46a0d62aa1c443"
+ },
+ {
+ "dataPath": "params_shard_97.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "343784019e030443b34d06730510da34"
+ },
+ {
+ "dataPath": "params_shard_98.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fb11603e3b3ecba3c3164b5cd0f40c04"
+ },
+ {
+ "dataPath": "params_shard_99.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c268018e057189582206c515fd66157f"
+ },
+ {
+ "dataPath": "params_shard_100.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fe6cc2707a9b4de91104c873ee47ebc3"
+ },
+ {
+ "dataPath": "params_shard_101.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d92c13cb2ce5a0bb961b9f32d7f85452"
+ },
+ {
+ "dataPath": "params_shard_102.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.15.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.15.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.16.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "d4e670a27a514c4f074fe6419af4e907"
+ },
+ {
+ "dataPath": "params_shard_103.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8c420ef4da23f5b1bffa0d3544fa1f76"
+ },
+ {
+ "dataPath": "params_shard_104.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a6633e9e16c5576c93b44ef8213a5f8"
+ },
+ {
+ "dataPath": "params_shard_105.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9d62baebfeb51a723b945abb8604d211"
+ },
+ {
+ "dataPath": "params_shard_106.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "48b7f2b7814e22a3543523d955acb68d"
+ },
+ {
+ "dataPath": "params_shard_107.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "68d4697910406651d71b0f3162bb6b98"
+ },
+ {
+ "dataPath": "params_shard_108.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.16.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.16.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.17.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "bd0d3f39b60911f1f78322f415737454"
+ },
+ {
+ "dataPath": "params_shard_109.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1417adb69974e8c6b3802a23ce782627"
+ },
+ {
+ "dataPath": "params_shard_110.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1dd528fdf6e0eae9939eb7fdfd4d1c16"
+ },
+ {
+ "dataPath": "params_shard_111.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "20136b10a5376e92c58a7b42cd37baf1"
+ },
+ {
+ "dataPath": "params_shard_112.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "163fe6673f6262094e028c589fcebf8d"
+ },
+ {
+ "dataPath": "params_shard_113.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "63e3dbe14f2faeb8120e90baae253245"
+ },
+ {
+ "dataPath": "params_shard_114.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.17.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.17.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.18.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "299431a3094815ea7546661af24f19b6"
+ },
+ {
+ "dataPath": "params_shard_115.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "793b305e1045d4d53f9513e1f3e6b940"
+ },
+ {
+ "dataPath": "params_shard_116.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0ad612a786ca67543a7454602d72b5d8"
+ },
+ {
+ "dataPath": "params_shard_117.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5a922fb3c0503eccfd7e100b879acedc"
+ },
+ {
+ "dataPath": "params_shard_118.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8ecd2e5512cc98722f01a0c538876a87"
+ },
+ {
+ "dataPath": "params_shard_119.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "72552d30d13a19426acb7b4732540841"
+ },
+ {
+ "dataPath": "params_shard_120.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.18.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.18.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.19.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "54c92979854fb480f6c99da98f34554d"
+ },
+ {
+ "dataPath": "params_shard_121.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9f3e49492661d523d8b12896c3472a48"
+ },
+ {
+ "dataPath": "params_shard_122.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dc90d74b7fb51dd9de52ae7c2b0403e7"
+ },
+ {
+ "dataPath": "params_shard_123.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0fdade6cb70a87de2dc82edb93c860b4"
+ },
+ {
+ "dataPath": "params_shard_124.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "82d20d0be1c6ec3cbf0ac229e491fc6f"
+ },
+ {
+ "dataPath": "params_shard_125.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9f889371e4ef6bc2f5472ea87e182f66"
+ },
+ {
+ "dataPath": "params_shard_126.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.19.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.19.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.20.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0f4e5929575191b98a434b8ebeb87923"
+ },
+ {
+ "dataPath": "params_shard_127.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "88d2dae990cf124e47c4cbec08922c0f"
+ },
+ {
+ "dataPath": "params_shard_128.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "61a3773fa5103d8d9af46c6ddd771ed2"
+ },
+ {
+ "dataPath": "params_shard_129.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f815a46f52c2cf2d5b10534b692a7084"
+ },
+ {
+ "dataPath": "params_shard_130.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fca70d337a5e874a836cb59b93f6dd07"
+ },
+ {
+ "dataPath": "params_shard_131.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "39008841620c74ca1aef4ac58cb91898"
+ },
+ {
+ "dataPath": "params_shard_132.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.20.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.20.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.21.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "18f1ee4ef2f0edb4d4093ba63343661a"
+ },
+ {
+ "dataPath": "params_shard_133.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dce00e7be553167dbfe25733e7272004"
+ },
+ {
+ "dataPath": "params_shard_134.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a31d79d41f5c0516010708715c1d197"
+ },
+ {
+ "dataPath": "params_shard_135.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3ddca491c7f32720f4e0fde60b01867c"
+ },
+ {
+ "dataPath": "params_shard_136.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0510fb8fc6ba6aa988fff213625bbf2e"
+ },
+ {
+ "dataPath": "params_shard_137.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0c9a1a8cd6f9efa89ff72b785eba6cb3"
+ },
+ {
+ "dataPath": "params_shard_138.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.21.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.21.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.22.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "95a0251da5c59a1488f7bab7c9437c8c"
+ },
+ {
+ "dataPath": "params_shard_139.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "51ecac71550791e32b663c50a712b74c"
+ },
+ {
+ "dataPath": "params_shard_140.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e11e3bbe5504cbb61ed1ef1b45d285a2"
+ },
+ {
+ "dataPath": "params_shard_141.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c42412a1bcf6316a397122710b6aaed9"
+ },
+ {
+ "dataPath": "params_shard_142.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ebff967a51662bfef80207925fdb5fe5"
+ },
+ {
+ "dataPath": "params_shard_143.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "012df5ba5975d1d67e2ea01e35d64b74"
+ },
+ {
+ "dataPath": "params_shard_144.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.22.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.22.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.23.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "df3fd3bce358f5512660b767a2f0d470"
+ },
+ {
+ "dataPath": "params_shard_145.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a004d23951ff9e6f46a096438cbfb525"
+ },
+ {
+ "dataPath": "params_shard_146.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "752af7daac637ac980fdf8a8242402af"
+ },
+ {
+ "dataPath": "params_shard_147.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4608b218b2d2147ce9dae5c2e8c80844"
+ },
+ {
+ "dataPath": "params_shard_148.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3e61e1e3b29b53f76eaadf73ac9b1bed"
+ },
+ {
+ "dataPath": "params_shard_149.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "336b672f32392ad02a2915a0217638ae"
+ },
+ {
+ "dataPath": "params_shard_150.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.23.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.23.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.24.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "eb6438744630c9dba1833260312b6916"
+ },
+ {
+ "dataPath": "params_shard_151.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9e0b6a7ef340b452038b6a068f150282"
+ },
+ {
+ "dataPath": "params_shard_152.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "eabf7be6e36f92b6c1d0b357121b6876"
+ },
+ {
+ "dataPath": "params_shard_153.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "59b910ba6202389ccaacd5a42090f307"
+ },
+ {
+ "dataPath": "params_shard_154.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "50efb68839c84863b00532e8d64b608e"
+ },
+ {
+ "dataPath": "params_shard_155.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "398cd429fd799a93768d33504916081c"
+ },
+ {
+ "dataPath": "params_shard_156.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.24.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.24.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.25.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "efe9e993dccb9d68e06dab611bfc36b0"
+ },
+ {
+ "dataPath": "params_shard_157.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "03bc60d040f94d59f9234d20dee210f0"
+ },
+ {
+ "dataPath": "params_shard_158.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "427634e75a9241cc3f854808b51104c0"
+ },
+ {
+ "dataPath": "params_shard_159.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6d3d6e46e1573a131d052d4a8a809933"
+ },
+ {
+ "dataPath": "params_shard_160.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "86cc6ce7494fdcc87dedc08e61666fd9"
+ },
+ {
+ "dataPath": "params_shard_161.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7acd46d2ec176557e6a923a1f71dba55"
+ },
+ {
+ "dataPath": "params_shard_162.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.25.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.25.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.26.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "1b0ca4a2736271af9deeb85f3785f673"
+ },
+ {
+ "dataPath": "params_shard_163.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e0395aeaecf379d4999b517de047123e"
+ },
+ {
+ "dataPath": "params_shard_164.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2dc39db68b5b2dfefc1679917778fd09"
+ },
+ {
+ "dataPath": "params_shard_165.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "992a5605cc94fbaf37a512cda0b9efcf"
+ },
+ {
+ "dataPath": "params_shard_166.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e98aeeb02e5c206e84969be9c48854b6"
+ },
+ {
+ "dataPath": "params_shard_167.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7d4b4516f376412d32abd1013606fae2"
+ },
+ {
+ "dataPath": "params_shard_168.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.26.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.26.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.27.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "a2807bc5935eb942e1817c8fe1b8322f"
+ },
+ {
+ "dataPath": "params_shard_169.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d819779db0bde9fa3c1a70f55491c61d"
+ },
+ {
+ "dataPath": "params_shard_170.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4d3d8819159487ae524710f6a55ef9d2"
+ },
+ {
+ "dataPath": "params_shard_171.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "618eb3aeb92661136270d8ec97b0cf4f"
+ },
+ {
+ "dataPath": "params_shard_172.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d43fe48134e25129b33918d3a26d5682"
+ },
+ {
+ "dataPath": "params_shard_173.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c309b9e8f3b033cdcd66f6ee8db4473c"
+ },
+ {
+ "dataPath": "params_shard_174.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.27.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.27.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.28.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "94af18c8b8fe4d27e28c9c52ad63c5ca"
+ },
+ {
+ "dataPath": "params_shard_175.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1da157f2f03c353d2a8582b0d03ad768"
+ },
+ {
+ "dataPath": "params_shard_176.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5c4557746e06e32ce52b56d75f0ad06c"
+ },
+ {
+ "dataPath": "params_shard_177.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fff58269ba29baebbc874b9c6c4b5403"
+ },
+ {
+ "dataPath": "params_shard_178.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d6122af64356560bc287c1125185d663"
+ },
+ {
+ "dataPath": "params_shard_179.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "37a369325d9983fa3ed0d16de0c0c558"
+ },
+ {
+ "dataPath": "params_shard_180.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.28.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.28.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.29.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "2c0425710d04da33f8b835837eae4f20"
+ },
+ {
+ "dataPath": "params_shard_181.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e458229df6e5ecdb10f5f2383ee8f4e2"
+ },
+ {
+ "dataPath": "params_shard_182.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7e9041ba5738626f2363819d66f5fdcf"
+ },
+ {
+ "dataPath": "params_shard_183.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ca86004b746ebb1f10566cfc6a704212"
+ },
+ {
+ "dataPath": "params_shard_184.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3f8d5aa4098028454ed8f9f2b930bfee"
+ },
+ {
+ "dataPath": "params_shard_185.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e2a75e74802eab2a18541c1abf68e99b"
+ },
+ {
+ "dataPath": "params_shard_186.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.29.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.29.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.30.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "9f9a3353e559a79896d1ee4e624fcf60"
+ },
+ {
+ "dataPath": "params_shard_187.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7f0da08dbff64b51d6a83a42d6d6283f"
+ },
+ {
+ "dataPath": "params_shard_188.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5ece3079612afeac7e4f0c3f3cb6494b"
+ },
+ {
+ "dataPath": "params_shard_189.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e33a1365da838d45459f80f103e9fc37"
+ },
+ {
+ "dataPath": "params_shard_190.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6552ce348c8a047340e42eb3231ecd73"
+ },
+ {
+ "dataPath": "params_shard_191.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4d326a209b36ecaac84a9555afec375b"
+ },
+ {
+ "dataPath": "params_shard_192.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.30.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.30.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.31.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3e278836a2028f736eca4befe008e448"
+ },
+ {
+ "dataPath": "params_shard_193.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "23d4cfe104b485aeda3174d1cea8c6cc"
+ },
+ {
+ "dataPath": "params_shard_194.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f914c1e208e39d6e642a57c1ab2afd10"
+ },
+ {
+ "dataPath": "params_shard_195.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "860b61044b798014c357ff6f10d9beb3"
+ },
+ {
+ "dataPath": "params_shard_196.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "06fe33bae3deb07dfaeff1634ead9d06"
+ },
+ {
+ "dataPath": "params_shard_197.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "57a2edaf53dd318c2dd12130c8f188ae"
+ },
+ {
+ "dataPath": "params_shard_198.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.31.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.31.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.32.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "f475fcad33025680e317391b2e2b2c6c"
+ },
+ {
+ "dataPath": "params_shard_199.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ae993c62edff8bf94208677c0d49a922"
+ },
+ {
+ "dataPath": "params_shard_200.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a3c358b2fe0cac2c3b5a6f9cc5ab5ff0"
+ },
+ {
+ "dataPath": "params_shard_201.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3929388efbdda78ae51cb20caba9e8f4"
+ },
+ {
+ "dataPath": "params_shard_202.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "aa67735df41736918e8f5feb78f795d3"
+ },
+ {
+ "dataPath": "params_shard_203.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cf1265578a5f4cda15619d20aa083162"
+ },
+ {
+ "dataPath": "params_shard_204.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.32.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.32.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.33.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "cb0a72057d3ad00f41f88f60717674ff"
+ },
+ {
+ "dataPath": "params_shard_205.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1c11f4d93900befbc0ee0e1521f525a6"
+ },
+ {
+ "dataPath": "params_shard_206.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "62523fc73cdb0b835ed06b69541622bf"
+ },
+ {
+ "dataPath": "params_shard_207.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "126dae4364f9217715e68722ecd0c348"
+ },
+ {
+ "dataPath": "params_shard_208.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "278a6d3012d2ffe18d6ff3de86aae1ee"
+ },
+ {
+ "dataPath": "params_shard_209.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "96a7f432c31c04dbf1a18ecd9227fc7b"
+ },
+ {
+ "dataPath": "params_shard_210.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.33.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.33.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.34.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "512877b6be9a639179cb63c69f06a1cd"
+ },
+ {
+ "dataPath": "params_shard_211.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bc43df6ca930bf4275f1c70aa4802e07"
+ },
+ {
+ "dataPath": "params_shard_212.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cefa27e004118023dc49e2ef4ae9b669"
+ },
+ {
+ "dataPath": "params_shard_213.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3f76e710be6bf2972494cd7d022d6e12"
+ },
+ {
+ "dataPath": "params_shard_214.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b139a50aad55fc83f6394eeeb29c6f52"
+ },
+ {
+ "dataPath": "params_shard_215.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e29ff26cf3a9bcc5da4844e46db7536f"
+ },
+ {
+ "dataPath": "params_shard_216.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.34.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.34.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.35.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "a8b3748269d3f95c1d1370e8a8ebdd50"
+ },
+ {
+ "dataPath": "params_shard_217.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bed782fd09e45c347ad559e8e5072ffa"
+ },
+ {
+ "dataPath": "params_shard_218.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0cfb21936fd9b599c845b13bd075d9ea"
+ },
+ {
+ "dataPath": "params_shard_219.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2725974f1510c1d403354c7c179cc4d1"
+ },
+ {
+ "dataPath": "params_shard_220.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8becd3bddf39d86a2c6620f4ab7ac2f3"
+ },
+ {
+ "dataPath": "params_shard_221.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b1cb0cbadbb441b3f480f943bafda8e2"
+ },
+ {
+ "dataPath": "params_shard_222.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.35.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.35.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.36.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c0bec3ec5fb95c5a1e474c7e664b8f33"
+ },
+ {
+ "dataPath": "params_shard_223.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "62bd8722614fcb6a85e8acf22c7aabed"
+ },
+ {
+ "dataPath": "params_shard_224.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c748c30de74131e6f2b06724bcc4ce8e"
+ },
+ {
+ "dataPath": "params_shard_225.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "819a332430157c13e368c8c4a1285c9f"
+ },
+ {
+ "dataPath": "params_shard_226.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "13e27af78e462080f98a7c6772b77b50"
+ },
+ {
+ "dataPath": "params_shard_227.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9040556dbb3661c7ba114df8368414cd"
+ },
+ {
+ "dataPath": "params_shard_228.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.36.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.36.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.37.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "725b7c787d7a55cc13d88444c6778899"
+ },
+ {
+ "dataPath": "params_shard_229.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "61ac7247c58c2aac5e656029d855a07a"
+ },
+ {
+ "dataPath": "params_shard_230.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e1a9725b87546d033d43533ffa38f804"
+ },
+ {
+ "dataPath": "params_shard_231.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "284d97aa60d5afc1dfd06139a2b28f01"
+ },
+ {
+ "dataPath": "params_shard_232.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "17f81c61ca1da9e1df7db1b736ee82c7"
+ },
+ {
+ "dataPath": "params_shard_233.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "79388d186722bf3a3ec58b1056da0b2b"
+ },
+ {
+ "dataPath": "params_shard_234.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.37.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.37.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.38.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "37c6c9f538b80b2baa78a7a3896bdcd4"
+ },
+ {
+ "dataPath": "params_shard_235.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e7a9e544367ca01a82bbe95427961fd0"
+ },
+ {
+ "dataPath": "params_shard_236.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9e6e53aeb67809933ea41048aad080be"
+ },
+ {
+ "dataPath": "params_shard_237.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5af9f3f393c4bd1c8f37631e2c488d32"
+ },
+ {
+ "dataPath": "params_shard_238.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a38d3c2f0192991b9b38506bd7f3f106"
+ },
+ {
+ "dataPath": "params_shard_239.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4eceb0073e3057b069134f9eff7945df"
+ },
+ {
+ "dataPath": "params_shard_240.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.38.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.38.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.39.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e68d3c7895452981dd0518a9b44ea776"
+ },
+ {
+ "dataPath": "params_shard_241.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ea6d86343e1855258dc182a800a4d2b5"
+ },
+ {
+ "dataPath": "params_shard_242.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0aa61fbea8a0e31e416deef0c16773b8"
+ },
+ {
+ "dataPath": "params_shard_243.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d778a8241c6a321827742aee3f35b12c"
+ },
+ {
+ "dataPath": "params_shard_244.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "15e031314915146ad0e5c014b3de5987"
+ },
+ {
+ "dataPath": "params_shard_245.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e4045c6c5758dadce200c66ad7caedf9"
+ },
+ {
+ "dataPath": "params_shard_246.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.39.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.39.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.40.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "7278f0271d5dd479d62f1c3439eca83f"
+ },
+ {
+ "dataPath": "params_shard_247.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7dc217df3c8cc97a3744962d5acee566"
+ },
+ {
+ "dataPath": "params_shard_248.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f6f0e9975de5fa8c46628ade3b5484da"
+ },
+ {
+ "dataPath": "params_shard_249.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c03306a51bfa6fe745b7d5d2f9732a97"
+ },
+ {
+ "dataPath": "params_shard_250.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "822fed4f6b5538648ad0042d2841a23d"
+ },
+ {
+ "dataPath": "params_shard_251.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e9fd0ec34ac9759a07281a2b1d8f25c7"
+ },
+ {
+ "dataPath": "params_shard_252.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.40.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.40.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.41.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "b3fda6a1b99f53cb4ba29d9c514016e6"
+ },
+ {
+ "dataPath": "params_shard_253.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2a7c46de7f9fd9bf79d08ccb8b53adc5"
+ },
+ {
+ "dataPath": "params_shard_254.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2a835ca06c0839e8d6f5a96ed2bebfca"
+ },
+ {
+ "dataPath": "params_shard_255.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "131d7d71345e3a0078520a1c463600b4"
+ },
+ {
+ "dataPath": "params_shard_256.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a5a4a4eaab2c04e8c56024e99f4ec365"
+ },
+ {
+ "dataPath": "params_shard_257.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b2451b322968cb0820b4c857937f39ee"
+ },
+ {
+ "dataPath": "params_shard_258.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.41.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.41.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.42.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "af6878f0a029845d141bd54d41813582"
+ },
+ {
+ "dataPath": "params_shard_259.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "374625e7f063378799667dd3d28791cc"
+ },
+ {
+ "dataPath": "params_shard_260.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ae3e41a16e5cf31b113e35a2fdcb17cb"
+ },
+ {
+ "dataPath": "params_shard_261.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e28fd4dc34f1e77922e7711cb84bdb0d"
+ },
+ {
+ "dataPath": "params_shard_262.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "24d43470b2a61851f1d0aa724f65ba5b"
+ },
+ {
+ "dataPath": "params_shard_263.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2b6758a378cc7c6a71d980813d50ac56"
+ },
+ {
+ "dataPath": "params_shard_264.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.42.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.42.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.43.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "4ca2411153668532408d64b41f844e36"
+ },
+ {
+ "dataPath": "params_shard_265.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2611f4a9cb926c71ada5888092ca0034"
+ },
+ {
+ "dataPath": "params_shard_266.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d3a98a8e146848847f848164aa9d0312"
+ },
+ {
+ "dataPath": "params_shard_267.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ca9ada01e9a0540a3abc940199e16f53"
+ },
+ {
+ "dataPath": "params_shard_268.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ae823724cf8520b16cadc221c5ea97d9"
+ },
+ {
+ "dataPath": "params_shard_269.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cd901a127dc79e2ed2a764715fbb018a"
+ },
+ {
+ "dataPath": "params_shard_270.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.43.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.43.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.44.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "d30ad2527e11a540d5ee02e044f28420"
+ },
+ {
+ "dataPath": "params_shard_271.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b19ebcd6bda0f55e1d4f0b376f91767a"
+ },
+ {
+ "dataPath": "params_shard_272.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "dfa8692ad9cd6ddb99cf4e1d496d2c69"
+ },
+ {
+ "dataPath": "params_shard_273.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "46fd1fcaf5489e7e2a10c78a6be74838"
+ },
+ {
+ "dataPath": "params_shard_274.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "adbe51be2b94e9629894b5804e0e9407"
+ },
+ {
+ "dataPath": "params_shard_275.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e57fb8307e7cf8fe2d8b831f8cf4975e"
+ },
+ {
+ "dataPath": "params_shard_276.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.44.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.44.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.45.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "05c499c5b9d362c3b877635ca39cfc21"
+ },
+ {
+ "dataPath": "params_shard_277.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b6e5f4be3e833a985468ca67e993a1e5"
+ },
+ {
+ "dataPath": "params_shard_278.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f8fcffc0ba2a11858a2b2ebc79360761"
+ },
+ {
+ "dataPath": "params_shard_279.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fe795e1ffe879aa8e87c2528531c60d8"
+ },
+ {
+ "dataPath": "params_shard_280.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a20e3cc24bb52d6f5b3bd9b99fb1f7b9"
+ },
+ {
+ "dataPath": "params_shard_281.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f2ac52a6590269469fd50fcf884cd508"
+ },
+ {
+ "dataPath": "params_shard_282.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.45.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.45.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.46.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "5ac56d3c461228107ebee3911676919d"
+ },
+ {
+ "dataPath": "params_shard_283.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "663c3f34e89b5b517bb381fbfe7557ac"
+ },
+ {
+ "dataPath": "params_shard_284.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d4982bd9762ec3aa8d6fa40208c143dc"
+ },
+ {
+ "dataPath": "params_shard_285.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d5c0b8f0e14b6d20379753bbeb29ea36"
+ },
+ {
+ "dataPath": "params_shard_286.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a29cbee9a62d505d7a6ae1e9593e7ed1"
+ },
+ {
+ "dataPath": "params_shard_287.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ac4b080929fc92ec0e9a6d2066712e61"
+ },
+ {
+ "dataPath": "params_shard_288.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.46.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.46.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.47.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "438f04bd27d7883939b2822cd82fc9f4"
+ },
+ {
+ "dataPath": "params_shard_289.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.48.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9597f604ee79e59e3233da7d887cc667"
+ },
+ {
+ "dataPath": "params_shard_290.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.48.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "25c626e13186bfb968a027b8ad75669f"
+ },
+ {
+ "dataPath": "params_shard_291.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9aa82634e22ce3364646ff4ee282843c"
+ },
+ {
+ "dataPath": "params_shard_292.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "16c081950fb0a203c7fe517221bac632"
+ },
+ {
+ "dataPath": "params_shard_293.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b75130a9426cc5878ca7adc37feb5d06"
+ },
+ {
+ "dataPath": "params_shard_294.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.47.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.47.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.48.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.48.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "67183418d9b0584f5709593da8b4067f"
+ },
+ {
+ "dataPath": "params_shard_295.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.49.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9889d460341c02d901966596bf262cdc"
+ },
+ {
+ "dataPath": "params_shard_296.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.49.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7c22439b8a2ff2cbbc205a820e68988e"
+ },
+ {
+ "dataPath": "params_shard_297.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "24bd92886bf03a9360245a7b415f8013"
+ },
+ {
+ "dataPath": "params_shard_298.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "07cc9229afe6edc077bdb3a397051d0d"
+ },
+ {
+ "dataPath": "params_shard_299.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4764653c765376f01e1f11148f024c00"
+ },
+ {
+ "dataPath": "params_shard_300.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.48.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.48.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.48.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.49.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.49.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3a047aeb9c0455902eef0084424d05ef"
+ },
+ {
+ "dataPath": "params_shard_301.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.50.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e35827193c0dd5e8bba0c6d37d179b06"
+ },
+ {
+ "dataPath": "params_shard_302.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.50.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "37bdea87bd37d94a0af44cba9d6916ff"
+ },
+ {
+ "dataPath": "params_shard_303.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f5b3d8d72605fc3ba49ef5e458593a24"
+ },
+ {
+ "dataPath": "params_shard_304.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "87a7707a1f51ab39f09ee8da7701c9df"
+ },
+ {
+ "dataPath": "params_shard_305.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5ab4d4423853cd949d394c0a7dbc5e2e"
+ },
+ {
+ "dataPath": "params_shard_306.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.49.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.49.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.49.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.50.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.50.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "5008d6497bda2c5bacc357c4975d84dc"
+ },
+ {
+ "dataPath": "params_shard_307.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.51.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "898769e571cfbbe506662c5af71fd627"
+ },
+ {
+ "dataPath": "params_shard_308.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.51.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "67caa3dfc7f6df3c7bc411429a957034"
+ },
+ {
+ "dataPath": "params_shard_309.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c12ba3baecf6319317e023fc4ea1236d"
+ },
+ {
+ "dataPath": "params_shard_310.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "642c08c68d1456774cddb62d0d1d37bc"
+ },
+ {
+ "dataPath": "params_shard_311.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ce5207136300d3fe4a0ab9f5b523c136"
+ },
+ {
+ "dataPath": "params_shard_312.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.50.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.50.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.50.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.51.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.51.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "28e733c6c84e569f87697b2a7a48bfaf"
+ },
+ {
+ "dataPath": "params_shard_313.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.52.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4e5987d3244c48b3aa0d46d1ceee2951"
+ },
+ {
+ "dataPath": "params_shard_314.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.52.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a173c5c565bc1892cfbfd258c1cb6289"
+ },
+ {
+ "dataPath": "params_shard_315.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "25394fc7a51a99827c101012ac3f5f19"
+ },
+ {
+ "dataPath": "params_shard_316.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b6f6ab4f9a40ec72cc039bb6840550bf"
+ },
+ {
+ "dataPath": "params_shard_317.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1bdc90db1498982bf164fb79785c876d"
+ },
+ {
+ "dataPath": "params_shard_318.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.51.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.51.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.51.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.52.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.52.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0cc4e820530177a74513adb27afbd9c8"
+ },
+ {
+ "dataPath": "params_shard_319.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.53.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fd96917f49ea5f021c4c33d30bed32b4"
+ },
+ {
+ "dataPath": "params_shard_320.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.53.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "41c50491e9d060338cb630ab2ba88999"
+ },
+ {
+ "dataPath": "params_shard_321.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bab4e1a1288bd5314754b46774495237"
+ },
+ {
+ "dataPath": "params_shard_322.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7c13baaa72e3f7916d895b1ec526977c"
+ },
+ {
+ "dataPath": "params_shard_323.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "19f2d96ab3750265f7f12328aae4b322"
+ },
+ {
+ "dataPath": "params_shard_324.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.52.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.52.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.52.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.53.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.53.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "01882d19d9896aa4f0e2f684bed12034"
+ },
+ {
+ "dataPath": "params_shard_325.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.54.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8b466389d5e67a19cfaf0cbe6dd8ba37"
+ },
+ {
+ "dataPath": "params_shard_326.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.54.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6e8acffaf0096d5dfdb61a156a7fd4a1"
+ },
+ {
+ "dataPath": "params_shard_327.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3b953a0e2f17d9d48281e62021524013"
+ },
+ {
+ "dataPath": "params_shard_328.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9a1a10b192e1f02c27370661bce28fb8"
+ },
+ {
+ "dataPath": "params_shard_329.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b2d3f3e3b1e39e0f79967860b7eb6a76"
+ },
+ {
+ "dataPath": "params_shard_330.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.53.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.53.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.53.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.54.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.54.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "774dc85439307a856b0fc4c7aeb20f18"
+ },
+ {
+ "dataPath": "params_shard_331.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.55.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e50be005424bc55d474087735ecc75e6"
+ },
+ {
+ "dataPath": "params_shard_332.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.55.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3ccd3056e2ec39fec7e2252ebb7b5201"
+ },
+ {
+ "dataPath": "params_shard_333.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "894f23f697dbc67bff0d490bfe3c6ca8"
+ },
+ {
+ "dataPath": "params_shard_334.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a4794ec700952f23bc76220dd1d76ff4"
+ },
+ {
+ "dataPath": "params_shard_335.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5e2c4c525807a481f26cf25492a2f479"
+ },
+ {
+ "dataPath": "params_shard_336.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.54.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.54.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.54.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.55.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.55.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "72d56789d090541ff4e311d0a2136035"
+ },
+ {
+ "dataPath": "params_shard_337.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.56.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a22693c144d25c14ea4c4878c8ef0c06"
+ },
+ {
+ "dataPath": "params_shard_338.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.56.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "63403d019ae94759c582efce72f9cc56"
+ },
+ {
+ "dataPath": "params_shard_339.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b20eb650134daeeca6eb08110c219595"
+ },
+ {
+ "dataPath": "params_shard_340.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8bfc35a9009de9225c3a12cb196e7954"
+ },
+ {
+ "dataPath": "params_shard_341.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a19d8cc746138a7b60884b207ad28ded"
+ },
+ {
+ "dataPath": "params_shard_342.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.55.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.55.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.55.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.56.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.56.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0ee1f7a8f52a37163816027cd8631d7f"
+ },
+ {
+ "dataPath": "params_shard_343.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.57.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "507c3daa67d84b90e930c67fa52a15b5"
+ },
+ {
+ "dataPath": "params_shard_344.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.57.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "db67da53b6209bf7ff8448563296d6ef"
+ },
+ {
+ "dataPath": "params_shard_345.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "67e3c67bd2a84887ba16228e28dd0ac1"
+ },
+ {
+ "dataPath": "params_shard_346.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2f6fade64d07f3ca3fbb3d257a49535a"
+ },
+ {
+ "dataPath": "params_shard_347.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "16925bb2bfc6d13779512a252839c5b9"
+ },
+ {
+ "dataPath": "params_shard_348.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.56.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.56.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.56.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.57.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.57.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "e03fe4d8fb5783798a74f2b88bb22f6e"
+ },
+ {
+ "dataPath": "params_shard_349.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.58.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9294f9b7199e1d8c3917ae043d9f5ff1"
+ },
+ {
+ "dataPath": "params_shard_350.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.58.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9fb78979622f2d2d1d60af9ebf040934"
+ },
+ {
+ "dataPath": "params_shard_351.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5439d9cc96994bb3978b2bedd1661a30"
+ },
+ {
+ "dataPath": "params_shard_352.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a1d1883a4127ea2ca97161a38e77357b"
+ },
+ {
+ "dataPath": "params_shard_353.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c8f52ab478c45d46bfe5c1dbcca973ea"
+ },
+ {
+ "dataPath": "params_shard_354.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.57.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.57.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.57.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.58.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.58.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "6bae95a7fbc2f6b207dc1b34143986df"
+ },
+ {
+ "dataPath": "params_shard_355.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.59.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "62c686f0eb51e72b81732e4d0fa48e04"
+ },
+ {
+ "dataPath": "params_shard_356.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.59.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4a29ade65ec4c06248fa509a9dddf7e1"
+ },
+ {
+ "dataPath": "params_shard_357.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "28bed2c7b3b1ecdf4b4d84b6c8093498"
+ },
+ {
+ "dataPath": "params_shard_358.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "26bba2dd3ca1f5993730a127ec469c31"
+ },
+ {
+ "dataPath": "params_shard_359.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "79b165d2163381b9f2946e97c33b877c"
+ },
+ {
+ "dataPath": "params_shard_360.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.58.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.58.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.58.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.59.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.59.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c9c3584887279af8aa8975b33630dcbe"
+ },
+ {
+ "dataPath": "params_shard_361.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.60.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a5c35e28fe19aeac8809ca6fbc65812c"
+ },
+ {
+ "dataPath": "params_shard_362.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.60.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "46abccbeaada7f1686efa4d572f2288a"
+ },
+ {
+ "dataPath": "params_shard_363.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2bfaf5563c4b8eb5ce36b2894be64da0"
+ },
+ {
+ "dataPath": "params_shard_364.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7ea0ed2d45a0289cda776e163eb62f60"
+ },
+ {
+ "dataPath": "params_shard_365.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "acb215a9fb8d817566ec255a88741a4a"
+ },
+ {
+ "dataPath": "params_shard_366.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.59.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.59.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.59.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.60.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.60.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "24031b013402757a95b725d1d58c624b"
+ },
+ {
+ "dataPath": "params_shard_367.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.61.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "57b888959c536bcb8bf205cc7b50152d"
+ },
+ {
+ "dataPath": "params_shard_368.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.61.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d4be0bfad9a37360e8265ebb8312f851"
+ },
+ {
+ "dataPath": "params_shard_369.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "aa014397cc342d8cda1359d485dbc65e"
+ },
+ {
+ "dataPath": "params_shard_370.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fc9fa177e2d442e80b365be7a2db9a92"
+ },
+ {
+ "dataPath": "params_shard_371.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "acfa98e682d887344f9b823ed57c7eb1"
+ },
+ {
+ "dataPath": "params_shard_372.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.60.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.60.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.60.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.61.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.61.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "9ac014c4df99567e2f0d5756e989a56e"
+ },
+ {
+ "dataPath": "params_shard_373.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.62.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3d0caab08ff06305cbc7f314eb1b63c4"
+ },
+ {
+ "dataPath": "params_shard_374.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.62.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "03b557a65f7c6d9989c6979c272f4110"
+ },
+ {
+ "dataPath": "params_shard_375.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5cfee4396006c3232b8e5cbc4195e4ce"
+ },
+ {
+ "dataPath": "params_shard_376.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "01068ac29c21f9bae4d47f07afcbd742"
+ },
+ {
+ "dataPath": "params_shard_377.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "84734260cde97db9b2a28884fb51840c"
+ },
+ {
+ "dataPath": "params_shard_378.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.61.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.61.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.61.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.62.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.62.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "4721356a89e76fae03225dc166c64b45"
+ },
+ {
+ "dataPath": "params_shard_379.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.63.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2bd737a0768c57fc61767eedd3da1b24"
+ },
+ {
+ "dataPath": "params_shard_380.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.63.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "775c04cdade416b12a90f76182a0e236"
+ },
+ {
+ "dataPath": "params_shard_381.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "13e2e18669fa832fef5c03d4b7bf7af0"
+ },
+ {
+ "dataPath": "params_shard_382.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ebf12e03b354719fb76bf41855d9cca5"
+ },
+ {
+ "dataPath": "params_shard_383.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4e2c7dfd6c7106cab04e9789c51b7ce0"
+ },
+ {
+ "dataPath": "params_shard_384.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.62.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.62.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.62.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.63.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.63.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "898ed8bebc824047cc7b661d3ecefaa9"
+ },
+ {
+ "dataPath": "params_shard_385.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.64.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5f3ecdee3ce4233813abedf394b394e1"
+ },
+ {
+ "dataPath": "params_shard_386.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.64.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9113a6c2931b3e2729e6872f9e273d60"
+ },
+ {
+ "dataPath": "params_shard_387.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6cda3ba42c9dd2b0dfde3c0da425afdc"
+ },
+ {
+ "dataPath": "params_shard_388.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "951e7a961c4b2f401a35777ef037b17b"
+ },
+ {
+ "dataPath": "params_shard_389.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "227f7680ad6a40274c63e35d1a4dba94"
+ },
+ {
+ "dataPath": "params_shard_390.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.63.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.63.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.63.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.64.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.64.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "890e02eb523a0696740e51737221a9c9"
+ },
+ {
+ "dataPath": "params_shard_391.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.65.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "89bec5040dddfe37b27f8d40388b075b"
+ },
+ {
+ "dataPath": "params_shard_392.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.65.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "16da05d32abdb1ab271f1b8a3e9487d3"
+ },
+ {
+ "dataPath": "params_shard_393.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6b519f1b4763fc05c1518c9daf5c62e6"
+ },
+ {
+ "dataPath": "params_shard_394.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5c2491aafa5d89eaee143f8986625202"
+ },
+ {
+ "dataPath": "params_shard_395.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f1388f14b8986ed0a660afd2dc29b339"
+ },
+ {
+ "dataPath": "params_shard_396.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.64.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.64.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.64.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.65.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.65.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "dd39b8a131088968d99fb6a49a31f3dd"
+ },
+ {
+ "dataPath": "params_shard_397.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.66.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fe1799ce3b4f78bb76b2fc7b012ad469"
+ },
+ {
+ "dataPath": "params_shard_398.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.66.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2961a9e76013f4cc8cdbb438893d7f38"
+ },
+ {
+ "dataPath": "params_shard_399.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3ca2f5aef783f3434a52c1be376c5beb"
+ },
+ {
+ "dataPath": "params_shard_400.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1d2d2a9ff595a15e18a1cb12f0e261c5"
+ },
+ {
+ "dataPath": "params_shard_401.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c6487217b5ca1d13e465239815e7d226"
+ },
+ {
+ "dataPath": "params_shard_402.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.65.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.65.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.65.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.66.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.66.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "1ab701cd78af3b96f24c728dae932c19"
+ },
+ {
+ "dataPath": "params_shard_403.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.67.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "64346add10c58ec087a6e2bad28ca61e"
+ },
+ {
+ "dataPath": "params_shard_404.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.67.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4512af4fdcd68d523299ecef9c3eb1ee"
+ },
+ {
+ "dataPath": "params_shard_405.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "63ea311ecab57d56745039d9a5e44b25"
+ },
+ {
+ "dataPath": "params_shard_406.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "52243cbe67bf1680d3c2952996cb67cf"
+ },
+ {
+ "dataPath": "params_shard_407.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d8836abae906061db23356323834aa9f"
+ },
+ {
+ "dataPath": "params_shard_408.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.66.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.66.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.66.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.67.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.67.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "3493add60010de68c1b0a1db8642f568"
+ },
+ {
+ "dataPath": "params_shard_409.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.68.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d0362e21e91beeed36049e3cf86036d0"
+ },
+ {
+ "dataPath": "params_shard_410.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.68.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d06c6a731f5cb92546bebb797c3e8ee0"
+ },
+ {
+ "dataPath": "params_shard_411.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d3d4f562b872fcf671348de7958ba5e0"
+ },
+ {
+ "dataPath": "params_shard_412.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "392c6246e17701d8d58f3c9519fdf246"
+ },
+ {
+ "dataPath": "params_shard_413.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f7d9917f207a7971d0be89a473d6d8a2"
+ },
+ {
+ "dataPath": "params_shard_414.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.67.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.67.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.67.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.68.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.68.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c4f23fb0c836de7034aaf5174e1b3993"
+ },
+ {
+ "dataPath": "params_shard_415.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.69.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1a1ef7b4b4311054fac6ddbfa332470a"
+ },
+ {
+ "dataPath": "params_shard_416.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.69.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b943175c25499b4aa81d59703a90c36c"
+ },
+ {
+ "dataPath": "params_shard_417.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "80d85f785d6f039f694ade4180f5233e"
+ },
+ {
+ "dataPath": "params_shard_418.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "312b0ea77ec14fc0c9a2b3c730fa8a22"
+ },
+ {
+ "dataPath": "params_shard_419.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6d6095a425e03e721d25322d6bbdb313"
+ },
+ {
+ "dataPath": "params_shard_420.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.68.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.68.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.68.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.69.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.69.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "5907ba7f58fe04573480c56805cd06a3"
+ },
+ {
+ "dataPath": "params_shard_421.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.70.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e22ff8ce332a0a73082cc7ded803b0a6"
+ },
+ {
+ "dataPath": "params_shard_422.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.70.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "701fa19f952ffea454247cf52683c941"
+ },
+ {
+ "dataPath": "params_shard_423.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d37d1e41eb2c537081ea3da7a56fb83f"
+ },
+ {
+ "dataPath": "params_shard_424.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0a383acfadd7e07f5efbe8339b1ecb78"
+ },
+ {
+ "dataPath": "params_shard_425.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f05866dbb3cd92594a0a4ea098181859"
+ },
+ {
+ "dataPath": "params_shard_426.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.69.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.69.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.69.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.70.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.70.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "6cf50e9a91ef7182e0d4f9c14a7aebd0"
+ },
+ {
+ "dataPath": "params_shard_427.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.71.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "04592ca0cfa5ad637d7b707b3806d1f9"
+ },
+ {
+ "dataPath": "params_shard_428.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.71.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "77f73fa70592063a146c366942b6da09"
+ },
+ {
+ "dataPath": "params_shard_429.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "106e2e5288c084fdf24cb38606a3f6ff"
+ },
+ {
+ "dataPath": "params_shard_430.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b5f0bb8c86151fb049b73d0257f49934"
+ },
+ {
+ "dataPath": "params_shard_431.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fe705a93811b97d41e68467724808329"
+ },
+ {
+ "dataPath": "params_shard_432.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.70.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.70.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.70.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.71.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.71.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "77aef38e7f0bf3439ab56bfae82b2446"
+ },
+ {
+ "dataPath": "params_shard_433.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.72.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "205573efdcf20a2a6f05971b038aa69a"
+ },
+ {
+ "dataPath": "params_shard_434.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.72.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6340eaa9051ce7af8695f9c70e9ca666"
+ },
+ {
+ "dataPath": "params_shard_435.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0c06b6f430a54095335b4bd3feb9428f"
+ },
+ {
+ "dataPath": "params_shard_436.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f24d07886cc45c582461dafe8f3992e3"
+ },
+ {
+ "dataPath": "params_shard_437.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9787e9629802560c47975b2246026c72"
+ },
+ {
+ "dataPath": "params_shard_438.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.71.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.71.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.71.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.72.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.72.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "eff87eb8df2fd9d416ac8fcb82ddc0ac"
+ },
+ {
+ "dataPath": "params_shard_439.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.73.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1c344c707efc2fe7949af5faab0fc97b"
+ },
+ {
+ "dataPath": "params_shard_440.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.73.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f9e6d164781f9f01e1a1fb6eea09727b"
+ },
+ {
+ "dataPath": "params_shard_441.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8d6b5201fcf0b5e4589add90db02c2df"
+ },
+ {
+ "dataPath": "params_shard_442.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "99be8f8ee7317bda642e36efd4b74633"
+ },
+ {
+ "dataPath": "params_shard_443.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0da75744c385e5b76de32f2aea078a2d"
+ },
+ {
+ "dataPath": "params_shard_444.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.72.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.72.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.72.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.73.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.73.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "987169a64c7af0b910d9f9c40c08a1cb"
+ },
+ {
+ "dataPath": "params_shard_445.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.74.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "047612ebde13b6d550d4878147e5ae0c"
+ },
+ {
+ "dataPath": "params_shard_446.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.74.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "669694bce70a0a7bcc7f80797884ddbd"
+ },
+ {
+ "dataPath": "params_shard_447.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "87e6936a91fc544a2ebd06246fc21adc"
+ },
+ {
+ "dataPath": "params_shard_448.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d5fd7ab14db07f7450e499daf593d209"
+ },
+ {
+ "dataPath": "params_shard_449.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "79add4990b5f75f0954b9adc81a40bc5"
+ },
+ {
+ "dataPath": "params_shard_450.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.73.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.73.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.73.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.74.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.74.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "0946db163b8643fc06667225f843a26e"
+ },
+ {
+ "dataPath": "params_shard_451.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.75.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a7ac0342ba94f26e80257cd4aeca0883"
+ },
+ {
+ "dataPath": "params_shard_452.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.75.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "66201ac4a8933ce649713bfceeae54bf"
+ },
+ {
+ "dataPath": "params_shard_453.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b8707b316c631457c70bd6c1b628cc64"
+ },
+ {
+ "dataPath": "params_shard_454.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "64d094fc97af0753742b339583737dc7"
+ },
+ {
+ "dataPath": "params_shard_455.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "09ca1a590ceb8711607a1a0a0dd51832"
+ },
+ {
+ "dataPath": "params_shard_456.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.74.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.74.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.74.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.75.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.75.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "adb4defec811675b023e97de7eb7c733"
+ },
+ {
+ "dataPath": "params_shard_457.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.76.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "947913fc58477ab9ffa47a5b89894d65"
+ },
+ {
+ "dataPath": "params_shard_458.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.76.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e2e6f1c52accfcfe9d82f10960dea6b5"
+ },
+ {
+ "dataPath": "params_shard_459.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "590199dca2c197446fbb85bd3ca43baa"
+ },
+ {
+ "dataPath": "params_shard_460.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cbcff28d1dbe1a67149eedbd0014372d"
+ },
+ {
+ "dataPath": "params_shard_461.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a9923af4b76a2e3e65e4861adb27d977"
+ },
+ {
+ "dataPath": "params_shard_462.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.75.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.75.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.75.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.76.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.76.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "c4ce9d733ba438afc2a724c135593f36"
+ },
+ {
+ "dataPath": "params_shard_463.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.77.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "244fb13d822be6c7d06898a735e60559"
+ },
+ {
+ "dataPath": "params_shard_464.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.77.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a5853e7acdf93790a330f47580bfa51e"
+ },
+ {
+ "dataPath": "params_shard_465.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0d5c22a0a5988d73d09471d89fc163c0"
+ },
+ {
+ "dataPath": "params_shard_466.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "18acd8799ca326ebbe3a2aff29e6e3ff"
+ },
+ {
+ "dataPath": "params_shard_467.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7342c731c9ff15c5adaba8edf7b4be16"
+ },
+ {
+ "dataPath": "params_shard_468.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.76.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.76.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.76.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.77.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.77.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "cdd8135716bd2dc5b535341e3eac820c"
+ },
+ {
+ "dataPath": "params_shard_469.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.78.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f8c80f59c4df01148f9c7aa0b4c025c2"
+ },
+ {
+ "dataPath": "params_shard_470.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.78.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "811de3bfa66f2f8b5dd4543560fc9d21"
+ },
+ {
+ "dataPath": "params_shard_471.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "61877e6bbdce8abddaa443d87579ad99"
+ },
+ {
+ "dataPath": "params_shard_472.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6866e9fecdfe546015f91f43a79ab4ce"
+ },
+ {
+ "dataPath": "params_shard_473.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a980cbc566cf413ef9ae6dcfd704e874"
+ },
+ {
+ "dataPath": "params_shard_474.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.77.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.77.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.77.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.78.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.78.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "bff4bb2bdb94554add45ff8cdd05d1e6"
+ },
+ {
+ "dataPath": "params_shard_475.bin",
+ "format": "raw-shard",
+ "nbytes": 41943040,
+ "records": [
+ {
+ "name": "model.layers.79.self_attn.qkv_proj.q_weight",
+ "shape": [
+ 10240,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 41943040,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "531fb937911ccee7083556ee675b6b14"
+ },
+ {
+ "dataPath": "params_shard_476.bin",
+ "format": "raw-shard",
+ "nbytes": 33554432,
+ "records": [
+ {
+ "name": "model.layers.79.self_attn.o_proj.q_weight",
+ "shape": [
+ 8192,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 33554432,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "40962de371c53cf1376f752638a77bd8"
+ },
+ {
+ "dataPath": "params_shard_477.bin",
+ "format": "raw-shard",
+ "nbytes": 234881024,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 57344,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 234881024,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "935323b86bd8a4818704bb722b125f78"
+ },
+ {
+ "dataPath": "params_shard_478.bin",
+ "format": "raw-shard",
+ "nbytes": 29360128,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 57344,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 29360128,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "42678600f504d0ef41c6cc1537a33354"
+ },
+ {
+ "dataPath": "params_shard_479.bin",
+ "format": "raw-shard",
+ "nbytes": 117440512,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.down_proj.q_weight",
+ "shape": [
+ 8192,
+ 3584
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 117440512,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c115c02ed782ff7ff9a7cfed9d686064"
+ },
+ {
+ "dataPath": "params_shard_480.bin",
+ "format": "raw-shard",
+ "nbytes": 24150016,
+ "records": [
+ {
+ "name": "model.layers.78.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.78.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.78.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.layers.79.self_attn.qkv_proj.q_scale",
+ "shape": [
+ 10240,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 5242880,
+ "byteOffset": 14712832
+ },
+ {
+ "name": "model.layers.79.self_attn.o_proj.q_scale",
+ "shape": [
+ 8192,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4194304,
+ "byteOffset": 19955712
+ }
+ ],
+ "md5sum": "fff910192a63a35b8b64b2ad87e7fa09"
+ },
+ {
+ "dataPath": "params_shard_481.bin",
+ "format": "raw-shard",
+ "nbytes": 525336576,
+ "records": [
+ {
+ "name": "lm_head.q_weight",
+ "shape": [
+ 128256,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 525336576,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ffb9a4821e85c82ea4b4036509e192c1"
+ },
+ {
+ "dataPath": "params_shard_482.bin",
+ "format": "raw-shard",
+ "nbytes": 65667072,
+ "records": [
+ {
+ "name": "lm_head.q_scale",
+ "shape": [
+ 128256,
+ 256
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 65667072,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "42dcf5cff51f226c09e1243f3df821ad"
+ },
+ {
+ "dataPath": "params_shard_483.bin",
+ "format": "raw-shard",
+ "nbytes": 14729216,
+ "records": [
+ {
+ "name": "model.layers.79.mlp.down_proj.q_scale",
+ "shape": [
+ 8192,
+ 896
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14680064,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.79.input_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14680064
+ },
+ {
+ "name": "model.layers.79.post_attention_layernorm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14696448
+ },
+ {
+ "name": "model.norm.weight",
+ "shape": [
+ 8192
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 16384,
+ "byteOffset": 14712832
+ }
+ ],
+ "md5sum": "f266c5ce63191a16a76da09c5e11b48a"
+ }
+ ]
+}
\ No newline at end of file
diff --git a/params_shard_0.bin b/params_shard_0.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d2de99a70b80d85d97f69d0cd733674e71cd2067
--- /dev/null
+++ b/params_shard_0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f06c49ec973144f3bb407cb37a1d20f157d59c11aeefbf034a506d09565ce4a
+size 525336576
diff --git a/params_shard_1.bin b/params_shard_1.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8cad7c5fd9a46571b143aabd32becae8aa9b7dfc
--- /dev/null
+++ b/params_shard_1.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:de198c859282d07e302964c39cc56fb945efb86e1b4702ac2f4dedd6faace2e2
+size 65667072
diff --git a/params_shard_10.bin b/params_shard_10.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b9dafa836d2d00ee0b1800f2bd6a48f9489afdaf
--- /dev/null
+++ b/params_shard_10.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b491290f229b7fdfc4d434d832c2d0c5b66fe9e108fa410c26322fe7ce6e7476
+size 234881024
diff --git a/params_shard_100.bin b/params_shard_100.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c63f294fec0ff89cac8853804eee878ab4ab6c21
--- /dev/null
+++ b/params_shard_100.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:52596a8ce9588eb777f663e3f98789308bd70db2056be332dd8cca84d34482e6
+size 29360128
diff --git a/params_shard_101.bin b/params_shard_101.bin
new file mode 100644
index 0000000000000000000000000000000000000000..85d252cc59d989d6d5ac1af90a35483174f523b4
--- /dev/null
+++ b/params_shard_101.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9b3a7334639f873efa6e66a92d568a6011a98a698dc2531869b0183e810441da
+size 117440512
diff --git a/params_shard_102.bin b/params_shard_102.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a48ab544fe9cfa3b3e053ed48c7643e888298003
--- /dev/null
+++ b/params_shard_102.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a58dbdb5a782ce874b0df662d2f487c1d1f0289a7a758b4af77e3da33dd60d38
+size 24150016
diff --git a/params_shard_103.bin b/params_shard_103.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eeeeb9b772f10d1ccf6a3f8354132536b270caff
--- /dev/null
+++ b/params_shard_103.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:70d9f6e2d3a6162418e2f404ec14c0db85ddfed3bd1e143ca820b428a521f535
+size 41943040
diff --git a/params_shard_104.bin b/params_shard_104.bin
new file mode 100644
index 0000000000000000000000000000000000000000..be224c589d68ff5a0af37fabe1e13d08f566070a
--- /dev/null
+++ b/params_shard_104.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c8188114191521ffd512c990602d9b29a57dac4548035a51808660d3e3dfa73
+size 33554432
diff --git a/params_shard_105.bin b/params_shard_105.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b49c859ba4fe8ba2ee7ca4c4453ae4940cccd09b
--- /dev/null
+++ b/params_shard_105.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0810abf4e1a45157b4a8aab7aedcece7d139abb6bb194aaec028b4ca16af8029
+size 234881024
diff --git a/params_shard_106.bin b/params_shard_106.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c409d59014126df657b1f9e0ef616820d63f416a
--- /dev/null
+++ b/params_shard_106.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3563a5a62de1a70dabe9a13ca4c664c9471911b070f347340c2a0ba5cd35f7dd
+size 29360128
diff --git a/params_shard_107.bin b/params_shard_107.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8b0b41893b2b559ce6e508ec2c4ebf45de388a12
--- /dev/null
+++ b/params_shard_107.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:072e0408c2763c40f5b7ff73aa790fdf69288263b5858aa1993cf37e864a4db8
+size 117440512
diff --git a/params_shard_108.bin b/params_shard_108.bin
new file mode 100644
index 0000000000000000000000000000000000000000..22ef04e8099d98479d12baf20912ea240a7a0e6d
--- /dev/null
+++ b/params_shard_108.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:721cb657946b6b2a92c2e756a25a1a67bb5781ec2838e7cc93ee49799daf049d
+size 24150016
diff --git a/params_shard_109.bin b/params_shard_109.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fbbe1139e7efa349761320d1a7629acaa6741634
--- /dev/null
+++ b/params_shard_109.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:06c2fc07ee4a01f73fa90ec4c1397335e484ae26bfd3b10e03423469b5bbedc1
+size 41943040
diff --git a/params_shard_11.bin b/params_shard_11.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e82e9b2c55f8ed0e1ebaddb7a815f202947f4bb4
--- /dev/null
+++ b/params_shard_11.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7b1b3f1bb0bce26b6422ee02999108a88c74f9e637124b1f347157b8632fb0c3
+size 29360128
diff --git a/params_shard_110.bin b/params_shard_110.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3d29793b1f8458fb2852d565120f446644f72229
--- /dev/null
+++ b/params_shard_110.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:740f7b8beb92976a574b984ba43eea061da965b10d9e3af52d5618097a2ce257
+size 33554432
diff --git a/params_shard_111.bin b/params_shard_111.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aae0cae6f9b85a6fcdd6a7c7343a58cd024a2450
--- /dev/null
+++ b/params_shard_111.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ff342cd518af5ab830dd42b044f379af56dcfdb549e5d0c2c304d5c95e4cf60c
+size 234881024
diff --git a/params_shard_112.bin b/params_shard_112.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b40ad178b9fb30c0fb478980e2f639fec09d6819
--- /dev/null
+++ b/params_shard_112.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4ab2cca2afb121d1cfac4681c37980a2cdb19627209d86e4edd0ea789c76ed57
+size 29360128
diff --git a/params_shard_113.bin b/params_shard_113.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8a668642e31e9d103763d350514140c581d2b537
--- /dev/null
+++ b/params_shard_113.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d538c8df5ed4381c69ba61f568f7be890d98b7cec47d0d25788ed924fe35e68e
+size 117440512
diff --git a/params_shard_114.bin b/params_shard_114.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8589b178e77a30f3a6352c9e75f15dbbeb2c2ca2
--- /dev/null
+++ b/params_shard_114.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:227f0ef6c2de6f74c0fba1c1220b5315856d2b7d60e8edae0cf644ceb1f2c0cb
+size 24150016
diff --git a/params_shard_115.bin b/params_shard_115.bin
new file mode 100644
index 0000000000000000000000000000000000000000..28a6606ea2c3441e25c0786cd9f0d1f8eca962a0
--- /dev/null
+++ b/params_shard_115.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:80ac99e5c0cfed4c71431c908b9441f87ece53159bd69106e0d75a1253ad8e69
+size 41943040
diff --git a/params_shard_116.bin b/params_shard_116.bin
new file mode 100644
index 0000000000000000000000000000000000000000..288519868d6e7b4ca7461e5095be18ed09281878
--- /dev/null
+++ b/params_shard_116.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d694c4bf9095a12f66ed61ba9708bf9cd5bcfee5b02e8dfa6e75d57da83591de
+size 33554432
diff --git a/params_shard_117.bin b/params_shard_117.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0616b8845521625b0867858f6c755ed7441d5176
--- /dev/null
+++ b/params_shard_117.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aa1ec753c5de887ab9fd5ceaa7d98b0851867b79e80ea345c5bac66e7eb6369b
+size 234881024
diff --git a/params_shard_118.bin b/params_shard_118.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d0d0be34785a76f15381571f8f257598e0a958ea
--- /dev/null
+++ b/params_shard_118.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:613b77d65a81f724e66b01e9436d4b1eb80e65d4f702fbcde1b6d54775be961d
+size 29360128
diff --git a/params_shard_119.bin b/params_shard_119.bin
new file mode 100644
index 0000000000000000000000000000000000000000..61ccc5f0615b58494a6390338c54a0e53ab34c2e
--- /dev/null
+++ b/params_shard_119.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e9b1713e84ea9d98b67a62ea540cbf6df46ab0b389ebee407920a9aaf22b9b6a
+size 117440512
diff --git a/params_shard_12.bin b/params_shard_12.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2248b0b06d6fe13c914a769afe041ef0c437e50c
--- /dev/null
+++ b/params_shard_12.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a65930efa2593f2605f6986ccea46036a1f311c2be672b87a454562b8ff0b75
+size 117440512
diff --git a/params_shard_120.bin b/params_shard_120.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0010dddc25b2ca4cdda1f6d93320ca2f94df0064
--- /dev/null
+++ b/params_shard_120.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3523c3c2281297440b224117a53b20ef019ae5945237b4b34835d05477e4ca2a
+size 24150016
diff --git a/params_shard_121.bin b/params_shard_121.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b80696a18c1126c441c2df0b37ce7770ed41cfaa
--- /dev/null
+++ b/params_shard_121.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0b7cb6bf928d2e970050b7981aed9aa09a214ff22057301e9739760e697d6a6f
+size 41943040
diff --git a/params_shard_122.bin b/params_shard_122.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8aa3e6fb9fa9db2cf53c9baa4ca7dbb47f3081db
--- /dev/null
+++ b/params_shard_122.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2cc045e6234215c3f2ca4f3cba9a712dfe3044797d0a7a2fc3bca4945fa7dac3
+size 33554432
diff --git a/params_shard_123.bin b/params_shard_123.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9d854b350152ef49f4d914b4ca7bbcb4fd5eb473
--- /dev/null
+++ b/params_shard_123.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bd486edbad5f3534ae1e5ae35b588fcbc9d98a3abf31e3c45c0e69fae094d324
+size 234881024
diff --git a/params_shard_124.bin b/params_shard_124.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9e71f396156922c11b791ef60f729fd65eb7dee0
--- /dev/null
+++ b/params_shard_124.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4117d7b7e6f264aee86da7a55348a21424e0264ddeb7341e7971f0d8f1532d26
+size 29360128
diff --git a/params_shard_125.bin b/params_shard_125.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b543da4450139c9a5892d0a375b6387fb0cc19e7
--- /dev/null
+++ b/params_shard_125.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5ef76583a942e575936cd8ccb378d0154c857c94ae1eb4bfe47cb4c99edff271
+size 117440512
diff --git a/params_shard_126.bin b/params_shard_126.bin
new file mode 100644
index 0000000000000000000000000000000000000000..738ff56828ea944e8ab6718196720be4a53554be
--- /dev/null
+++ b/params_shard_126.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:662f4d00bf7eb1b36c6b7da19afc59d87e845b68eef155a149c7d82d513c9f9a
+size 24150016
diff --git a/params_shard_127.bin b/params_shard_127.bin
new file mode 100644
index 0000000000000000000000000000000000000000..460a53b44ffcc83f5ca67c64c196bd7721343753
--- /dev/null
+++ b/params_shard_127.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c0947fc5b9c677832bd12a590e3de8289fdd8c2bde8261a7c45396db605d4cf7
+size 41943040
diff --git a/params_shard_128.bin b/params_shard_128.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f211d1ee50b32819d38da05aae8b23a5e3641c50
--- /dev/null
+++ b/params_shard_128.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0e0bdf4643278b87e02350a8984567ae1d7a218f73198371ac88f230f225d8dd
+size 33554432
diff --git a/params_shard_129.bin b/params_shard_129.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ee818251a7febd0d1355d0dae524923023a6a57c
--- /dev/null
+++ b/params_shard_129.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:089434e0802f9e8edcb41a287e21d54eea618f399307b116e1c8a184d4d3fe0d
+size 234881024
diff --git a/params_shard_13.bin b/params_shard_13.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b24d1840a659ddc6a2e5518f09ce9945d5f5a794
--- /dev/null
+++ b/params_shard_13.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4516288dc15756c349c34bdfde47cf74390c9340c0e9b39ebf8e35eb46be063f
+size 41943040
diff --git a/params_shard_130.bin b/params_shard_130.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d8e14f9c93e1f0f155202edb07b44f95d557fa5c
--- /dev/null
+++ b/params_shard_130.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be107305fa3179cb34a8d8ff62399c1a5e36eaaf465a2b471fb580c05ac12475
+size 29360128
diff --git a/params_shard_131.bin b/params_shard_131.bin
new file mode 100644
index 0000000000000000000000000000000000000000..123a8d95b1893f3bce6d4f6b48557b1a796736ed
--- /dev/null
+++ b/params_shard_131.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:65bc20b1878eea63eed93c142284a87de56abccc93fe82349bdf6d8b0def6364
+size 117440512
diff --git a/params_shard_132.bin b/params_shard_132.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6de7e314999580c68781b30a2b9d124f1b5ae764
--- /dev/null
+++ b/params_shard_132.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1fe38c74de656d97a7e3fa4e9e068e4750a1955ac4800eec42a08240c2a4206f
+size 24150016
diff --git a/params_shard_133.bin b/params_shard_133.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9d3ca70f6b3a3b26377dd6be47e6a79d357a8d20
--- /dev/null
+++ b/params_shard_133.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:37b1ace92132f0b4ad52777021a412c32762025c5fb72604ad5a6bc0b50fe975
+size 41943040
diff --git a/params_shard_134.bin b/params_shard_134.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e1321670404411debac6bc37a7eea917ca614afc
--- /dev/null
+++ b/params_shard_134.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aa72d08bdf084090a1f07d08b26df346835cb37a92c32daf5f24751857b1dfee
+size 33554432
diff --git a/params_shard_135.bin b/params_shard_135.bin
new file mode 100644
index 0000000000000000000000000000000000000000..30c368ebe1609c5dee2d9e3b030a99ede300c237
--- /dev/null
+++ b/params_shard_135.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cc708eea0a71e69caf8a24a4ad55e104b36a5de57747d3804a14a7c26c3a805d
+size 234881024
diff --git a/params_shard_136.bin b/params_shard_136.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e62eee8f0b4801eb79feaf5116cb8747da8bf0d1
--- /dev/null
+++ b/params_shard_136.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1696e0cf512990f8906bb03bd95ea5a4ab147e6623ef3d50af4e33c25499a976
+size 29360128
diff --git a/params_shard_137.bin b/params_shard_137.bin
new file mode 100644
index 0000000000000000000000000000000000000000..74f7f15c1a67a6c92b53867d920c215d7a60fa0e
--- /dev/null
+++ b/params_shard_137.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be24d99d33db858fdaebebf725d3480f1bfd1236449fba59d3a5f1a1d447f03a
+size 117440512
diff --git a/params_shard_138.bin b/params_shard_138.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ce0b72bd46913251b2012c50da6579b601db8e9a
--- /dev/null
+++ b/params_shard_138.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cd0bf176d530fdc3e6ef8994638e1d104009d04e3a16b0e725cdbd2fd6a00fc0
+size 24150016
diff --git a/params_shard_139.bin b/params_shard_139.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cad52682710fe1e878b579bacc5c9a938e8ffec6
--- /dev/null
+++ b/params_shard_139.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:48a0456b539b68efb4233cbd33be15dcab386ddd38c2b706c14f7ae2127672b6
+size 41943040
diff --git a/params_shard_14.bin b/params_shard_14.bin
new file mode 100644
index 0000000000000000000000000000000000000000..456e0c0ea0a72079ca2984c6a92be6ab84ced44b
--- /dev/null
+++ b/params_shard_14.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dd8bcf619427a3f85220c1b1b1701ce19eb35ab4b5c29fd816d217c55e943485
+size 33554432
diff --git a/params_shard_140.bin b/params_shard_140.bin
new file mode 100644
index 0000000000000000000000000000000000000000..afb2374437fbbf794e87bce0b5a8eca0ec36e11d
--- /dev/null
+++ b/params_shard_140.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1d655973a8c624b272e11b9d7f70326b11f5734d555437b452bec7c3e027c8fd
+size 33554432
diff --git a/params_shard_141.bin b/params_shard_141.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bf0118390ae1b7bfb6e5aeb1ff4277c67ae854a8
--- /dev/null
+++ b/params_shard_141.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:43e93307a4d6153f473a6cc709ed799fa77ef8ed442f8c2a46a17a4d9084bef5
+size 234881024
diff --git a/params_shard_142.bin b/params_shard_142.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6297a5c5481d2c0f0d45a905cd65450a431324ab
--- /dev/null
+++ b/params_shard_142.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a2141178a208ec9089fa2656eeeae74ec5fe23e7e1a6643067f88284bd606992
+size 29360128
diff --git a/params_shard_143.bin b/params_shard_143.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0391685045f9b7bcdc371c4596b109aa0206c8a0
--- /dev/null
+++ b/params_shard_143.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9fe90c2f955ad26501cb4c4e19cdb9ac003d80bcba05b4a9d98ffbf7b96d801f
+size 117440512
diff --git a/params_shard_144.bin b/params_shard_144.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2a4bd99e015ffe30a86caefe9c90b7d4831a07dc
--- /dev/null
+++ b/params_shard_144.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b4e5ecafc7830fd231c73392cd9b88fdc30d9f6ec16c2c6d3b285df7aa8d5751
+size 24150016
diff --git a/params_shard_145.bin b/params_shard_145.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fe23bbc420dbd0fc6c754d3739904aacb6abfdd8
--- /dev/null
+++ b/params_shard_145.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b874b45ea6ce93279597126fa4f2e0f4e9aaec1d10312cb139c936b99a2c5db7
+size 41943040
diff --git a/params_shard_146.bin b/params_shard_146.bin
new file mode 100644
index 0000000000000000000000000000000000000000..54ce44eaa9b9372161e0a0103c452ace8021a662
--- /dev/null
+++ b/params_shard_146.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:419bf8d1647e6789139754d7a40c2d5a6138a49aec09dfbdc85066dc5eab6cf4
+size 33554432
diff --git a/params_shard_147.bin b/params_shard_147.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1319264895916baae174ea97fcadf4f922396c51
--- /dev/null
+++ b/params_shard_147.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dcb33f7d1665fad824daac0fcd00e73a0e540989cad69d7173bcaa52b03789ab
+size 234881024
diff --git a/params_shard_148.bin b/params_shard_148.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d2b8424e01427598f88f9e4f6726dddef051ada6
--- /dev/null
+++ b/params_shard_148.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3b2809fb7cf2c905dc567b5797fbff60c0a8d1d427516aaa90549e600d156000
+size 29360128
diff --git a/params_shard_149.bin b/params_shard_149.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b8b84c52cf35686ff297af4ed4fc1055c9f80bde
--- /dev/null
+++ b/params_shard_149.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a00694fa6a35fe07b3f4fcccbb069f1c8818f83a3569d0e6a434de7413507007
+size 117440512
diff --git a/params_shard_15.bin b/params_shard_15.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ec8c63b062f0e3315c8e6cdce7d4fb4bb9e41fe
--- /dev/null
+++ b/params_shard_15.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3674682c097878d565e84ae2086032eddae7c730ed307ea23a1839fa28efb6e0
+size 234881024
diff --git a/params_shard_150.bin b/params_shard_150.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bd594c0c7f20cbea9efb13aab4ceed649c73378b
--- /dev/null
+++ b/params_shard_150.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d39de324351cecd4a421d7cac7273770f1c2bcf8a071e90e87076016b4df64ed
+size 24150016
diff --git a/params_shard_151.bin b/params_shard_151.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ec9e43ee2d27be638762be05480c51c102e7c981
--- /dev/null
+++ b/params_shard_151.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5b1014f4df80e483f09bc35de9f81480764e213cedae7ff2de2e24965e83ffe1
+size 41943040
diff --git a/params_shard_152.bin b/params_shard_152.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dab519d86e3ecab68af598f8da40c825a18db8f6
--- /dev/null
+++ b/params_shard_152.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b9ff6db97b6460bf5ac3f811aa9bcb359ade68b5aa49d0e81cd0c183f952baaa
+size 33554432
diff --git a/params_shard_153.bin b/params_shard_153.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9acfd43bc983951e364a38bb07a240554b9647b1
--- /dev/null
+++ b/params_shard_153.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:21eb0fb1e00d2e5d5a9841903f15a6af8c88506be64ec2e9e128daaa21bb7d2f
+size 234881024
diff --git a/params_shard_154.bin b/params_shard_154.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ebc2fc4060d1ba8a379858e6607ddf1bbf43b4d
--- /dev/null
+++ b/params_shard_154.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2bb9731cfd6cc9fb6168ebec66c0a046698cd0f30c1d396b7a2916f1c66a8d90
+size 29360128
diff --git a/params_shard_155.bin b/params_shard_155.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b6ee0f8eac5077dd7ab580c9b8fa41e9e103196c
--- /dev/null
+++ b/params_shard_155.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:daeb39ac3f89bf829fb33a300f924e60457bb795d56257a673783e7045118360
+size 117440512
diff --git a/params_shard_156.bin b/params_shard_156.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4a014fdfa5ea2a0c288cfc36ce3db2319d60b5eb
--- /dev/null
+++ b/params_shard_156.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fa7eb50cec6e453ea3e758b9c5aeaa834e0bbb2fe5291139ea669480b7bd87a6
+size 24150016
diff --git a/params_shard_157.bin b/params_shard_157.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2aace9ff551d4f151a3fc227c61b102f8c1e8a87
--- /dev/null
+++ b/params_shard_157.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:20aa35400b0928ead288ac0d61b6c4177983cb4f3b61d1e5784499d936a0a95c
+size 41943040
diff --git a/params_shard_158.bin b/params_shard_158.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8bba8b433a0e969d8d51f3ae619d252842fcf1bf
--- /dev/null
+++ b/params_shard_158.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4fe4ac5a7c1bb15e3e9bbc8080d12530320d6c03c5952628b631d0b633ff2510
+size 33554432
diff --git a/params_shard_159.bin b/params_shard_159.bin
new file mode 100644
index 0000000000000000000000000000000000000000..72beb9ee6675fb3016eb77cd9ebb1cb3f2cfff31
--- /dev/null
+++ b/params_shard_159.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:300ec30d9fd9ef96fbab1505d7b94aa5698f9e1d7cb4b16e097340edd34cc7d7
+size 234881024
diff --git a/params_shard_16.bin b/params_shard_16.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9c4b5dc7de88d61f71f38823f922b8b0dc52586b
--- /dev/null
+++ b/params_shard_16.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:81dd114ae889bce4b20fcec2159973a831dca9bbc364f715860e98f7d874ea31
+size 29360128
diff --git a/params_shard_160.bin b/params_shard_160.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dbbb1ff925ca29bdc4ba88ffcf67b4b340547656
--- /dev/null
+++ b/params_shard_160.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:19fb9c6c329df420f194e5f5b26a0a1a45a52f839d8d27de152808fc8454f162
+size 29360128
diff --git a/params_shard_161.bin b/params_shard_161.bin
new file mode 100644
index 0000000000000000000000000000000000000000..381452f4dcdb0046c73764358002c6f80e24bcd9
--- /dev/null
+++ b/params_shard_161.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0d89ecdf713d857ae4564034f0d1be97ed87dd5fe17de76c57d55f0522e57d59
+size 117440512
diff --git a/params_shard_162.bin b/params_shard_162.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0f3311530244b000ca072520a2c8d273c6728b3d
--- /dev/null
+++ b/params_shard_162.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bbdc6f16a03b9a330d2d87ca4c2e3bbb924491ae79b5f4d6920dfa03e44bada9
+size 24150016
diff --git a/params_shard_163.bin b/params_shard_163.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f3b668b2f90a92fd691a63c91e746c1a762fc033
--- /dev/null
+++ b/params_shard_163.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:04fa95ac471eaee7dab7c497257bb379b050c2173f8fd767b3125a6968d7fd29
+size 41943040
diff --git a/params_shard_164.bin b/params_shard_164.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f50f203cd037384453e9f20021f1f5ada67b8c5b
--- /dev/null
+++ b/params_shard_164.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7c49c6ede0ceb18291fb0f46731b9639ce8f66365c32d61c2248f1db332fa81
+size 33554432
diff --git a/params_shard_165.bin b/params_shard_165.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cf29164ba5eff2e3186e839c3a1f1caeba52e017
--- /dev/null
+++ b/params_shard_165.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c0b1b79f22226c5a93ef2c6c255636b15f027e701d674ddf546cd963e6499ede
+size 234881024
diff --git a/params_shard_166.bin b/params_shard_166.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b6d895fac3b7fa13711a72415e44fa247bd91e72
--- /dev/null
+++ b/params_shard_166.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:04400557fc27f5b2f32a7a476c94cd480582973aec02718d2861e83cfc709e93
+size 29360128
diff --git a/params_shard_167.bin b/params_shard_167.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c63cc34a93b50a59d2524adcc9d4936f3b66bb90
--- /dev/null
+++ b/params_shard_167.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a504a177863dcb08bead0767508423053698aa96395d663c6bbf72e8bdcfd9c6
+size 117440512
diff --git a/params_shard_168.bin b/params_shard_168.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9b58d186d38ce80f33a359babbcfef6c5861314a
--- /dev/null
+++ b/params_shard_168.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38055fb3c31d27b24cba9ef91f227617ca567e93022dab57156e482246c9311e
+size 24150016
diff --git a/params_shard_169.bin b/params_shard_169.bin
new file mode 100644
index 0000000000000000000000000000000000000000..14e351ed4472f61ae19d06c8dc2e459d152bb151
--- /dev/null
+++ b/params_shard_169.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d55e7208b66df33956606beed8e668d6f1f4fb6f931cbbe630d93f64f67a1d07
+size 41943040
diff --git a/params_shard_17.bin b/params_shard_17.bin
new file mode 100644
index 0000000000000000000000000000000000000000..21cbb47d503632dd63c8f297616594ad9db7d293
--- /dev/null
+++ b/params_shard_17.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d558783f0dd8c32d2ba9e68d963db4aeedd4ede2f66e0018e4028ddf1aa24242
+size 117440512
diff --git a/params_shard_170.bin b/params_shard_170.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7d3e32ed843fcd2cdc0fa8d4cacf59918b146468
--- /dev/null
+++ b/params_shard_170.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f5f6f664e1a5102dd0bf5a080c28e388b460c82ddd20f971aedcf36c0e9a82ef
+size 33554432
diff --git a/params_shard_171.bin b/params_shard_171.bin
new file mode 100644
index 0000000000000000000000000000000000000000..65d2be313f9f7a6ce38d67abaf347d7c70e94337
--- /dev/null
+++ b/params_shard_171.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0fb8e1ed2c455790e31ce34a3e83ef98ecba307b09163a9c7a22b7cee68ed723
+size 234881024
diff --git a/params_shard_172.bin b/params_shard_172.bin
new file mode 100644
index 0000000000000000000000000000000000000000..40b2a2e2861fd6b658686ce4e40f3ba7261e7d38
--- /dev/null
+++ b/params_shard_172.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e21ccfb4858f5b0b18b1cd3c706426914990be1787d3f5d8ff5155e05cf8c1a
+size 29360128
diff --git a/params_shard_173.bin b/params_shard_173.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3dc03fd37f10c19e959716353e8a98d2e96dcd2d
--- /dev/null
+++ b/params_shard_173.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1150e62b37e247a755df27fce9d06a132448816ce927fa2b05ed37c65c3c81be
+size 117440512
diff --git a/params_shard_174.bin b/params_shard_174.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7b3bdceb5f7583094b8d29a431142900966038f6
--- /dev/null
+++ b/params_shard_174.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e357478826064e0ec86a96ab951329af3919cc54f300d473d902b96820277653
+size 24150016
diff --git a/params_shard_175.bin b/params_shard_175.bin
new file mode 100644
index 0000000000000000000000000000000000000000..128999ef7d90f8099f3774b639763b6380dae315
--- /dev/null
+++ b/params_shard_175.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c805d5edfab9970ef2f55e49295de7a1847b9b210cf25f258098d4ea804a1155
+size 41943040
diff --git a/params_shard_176.bin b/params_shard_176.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1fe789a17bc28e7d011df6e37b28f2c1a5d395f5
--- /dev/null
+++ b/params_shard_176.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b6b9b82d57e051dd94744ace82f65814dfec6f5929deab55ca9958f86cf9d2a1
+size 33554432
diff --git a/params_shard_177.bin b/params_shard_177.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b453368bc8ed3accabe5bf7fa32df4f77a9298d3
--- /dev/null
+++ b/params_shard_177.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:19519599bd596f6decc09899af921d7d24f37d0ba225c450b0f37993aca8dea2
+size 234881024
diff --git a/params_shard_178.bin b/params_shard_178.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ee4d2a3a702b0174696bb87f8ccbd7abae6155a0
--- /dev/null
+++ b/params_shard_178.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2ac01a6f2c596990f749c6774cd8c4d6cb1731b69c31e32193b52c4c6dd9b16b
+size 29360128
diff --git a/params_shard_179.bin b/params_shard_179.bin
new file mode 100644
index 0000000000000000000000000000000000000000..be791ac4862dbf2ffbd7aa668dc2444567164b7a
--- /dev/null
+++ b/params_shard_179.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2e564e66c64ab3edf07173c80fbf6f9c8d3eea4104833ddcadc2edfcfc41fa88
+size 117440512
diff --git a/params_shard_18.bin b/params_shard_18.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cef1756a06b53f71949e450affccad9eec2a86ad
--- /dev/null
+++ b/params_shard_18.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aaba111deceeffe4517d9253444372abd0103a7e1d254a631e04b834efee3ef3
+size 28344320
diff --git a/params_shard_180.bin b/params_shard_180.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9147a48324c69552eacde45b23ed207bcd3162e3
--- /dev/null
+++ b/params_shard_180.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:30cf54c6513c37991f8a0dac9f6fc7523a0325c73ec38eac75b880e4d7e27e98
+size 24150016
diff --git a/params_shard_181.bin b/params_shard_181.bin
new file mode 100644
index 0000000000000000000000000000000000000000..77240be9c781a6217fbde085d5d93e89e543c29f
--- /dev/null
+++ b/params_shard_181.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:592d09a92da902c06b8b96f86d23ec97406b062459c64a490ee54fde02ff4644
+size 41943040
diff --git a/params_shard_182.bin b/params_shard_182.bin
new file mode 100644
index 0000000000000000000000000000000000000000..25edc6dbb05eb32225b3012ab2ac31a341491358
--- /dev/null
+++ b/params_shard_182.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:36573f9f3f8015de0b42729c9d0c74c4beadd81c740488387275b03ea1e0ce16
+size 33554432
diff --git a/params_shard_183.bin b/params_shard_183.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9e03634620e8055b12012d014a7bf9f028c8b9b3
--- /dev/null
+++ b/params_shard_183.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c0f8f7ef2c7d568111f7be763cc94accdb82d3702a56cce29bea599094e3f045
+size 234881024
diff --git a/params_shard_184.bin b/params_shard_184.bin
new file mode 100644
index 0000000000000000000000000000000000000000..63bf5a6a97937bbf9e3a169cf5f3f65a7dbdcce1
--- /dev/null
+++ b/params_shard_184.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:30fd62e24256562bcd6dcfaff1b7582055ed19dfe2cce8cdb249a6e0cf39165f
+size 29360128
diff --git a/params_shard_185.bin b/params_shard_185.bin
new file mode 100644
index 0000000000000000000000000000000000000000..160ba40ec43153a404963dffab9536411a544c36
--- /dev/null
+++ b/params_shard_185.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b53a52030495caa166fd81b165421e2d8a1d199d676d406c517ff6f34be25f66
+size 117440512
diff --git a/params_shard_186.bin b/params_shard_186.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bc1153e048aead10c40317a0f82d9756420dc147
--- /dev/null
+++ b/params_shard_186.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4df9b1f674393ae5e165d38a1b3c743b53e1697fcb1051588315753702a5347
+size 24150016
diff --git a/params_shard_187.bin b/params_shard_187.bin
new file mode 100644
index 0000000000000000000000000000000000000000..74dc25c01250b6e84a9c1e8692ff467f77c58698
--- /dev/null
+++ b/params_shard_187.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:193103f322d6199ab571ab0ac654d7c2317296be7b3bc0f9eee427bf6788f9de
+size 41943040
diff --git a/params_shard_188.bin b/params_shard_188.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ef06f6b8e19aec0b4c4a71056cd99b9a1dd49624
--- /dev/null
+++ b/params_shard_188.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3fe43ae58cc853d99babfa6c027119cf188fc48777bc83c509b83f00001103a3
+size 33554432
diff --git a/params_shard_189.bin b/params_shard_189.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5b1bc4a9204374a6d600a1c38918729e9fd3d289
--- /dev/null
+++ b/params_shard_189.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:50fbc6e3de2a0956ceb08a2086839771546cc2ccfa5238e81c3a21d43d05d906
+size 234881024
diff --git a/params_shard_19.bin b/params_shard_19.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1ec4c872e4a1150cd308940ba4108eb7891b6eb0
--- /dev/null
+++ b/params_shard_19.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3155e4ff32b8ab7a15305c0617392f43b7e1170b4d7dfe10108a6134655bd14
+size 41943040
diff --git a/params_shard_190.bin b/params_shard_190.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5028eb1cdfc0c6a20c06695c57460c5c97e5d2a7
--- /dev/null
+++ b/params_shard_190.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c8a645cbc4ef4810939ca95fe5af938461564d2299f06c62de0c3f99a800928
+size 29360128
diff --git a/params_shard_191.bin b/params_shard_191.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6dbc2dd53841ead684560c514f90dba3111178d3
--- /dev/null
+++ b/params_shard_191.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:995a4abb7acde78872eab45b0ad4d89d488b0b0441e15c73eba2bea063e7b183
+size 117440512
diff --git a/params_shard_192.bin b/params_shard_192.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9a19f3b93a6991e61d0d7a2ded94b41b133537d2
--- /dev/null
+++ b/params_shard_192.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:750b0abab93ce3ff94a513c6a3a3e7eafe4336222da89fece2f310cd2c2175ef
+size 24150016
diff --git a/params_shard_193.bin b/params_shard_193.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6d58f87268adc1d9a9896d881db67a62f4655a7a
--- /dev/null
+++ b/params_shard_193.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4cc6c7a449e994fdd85aca847482dfde146af0876188a5bc6693be59dff4b9d7
+size 41943040
diff --git a/params_shard_194.bin b/params_shard_194.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ee79a7106f7d0107fae88892aae3aa38327d6aff
--- /dev/null
+++ b/params_shard_194.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bf0c2aed1005b0367f05b69ccec1ca0671f6bacbd061d132ac4c79fd5c6f399d
+size 33554432
diff --git a/params_shard_195.bin b/params_shard_195.bin
new file mode 100644
index 0000000000000000000000000000000000000000..02f6a6e673d7586bcb1d0a32ce75e8ec97c21713
--- /dev/null
+++ b/params_shard_195.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:82e9ab23edc501fdfce3e0a21adabe03c74e727d601e5e46ea29a3ab0121a6cb
+size 234881024
diff --git a/params_shard_196.bin b/params_shard_196.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d25bbea4b5c9d01f6961d2600e0f198446de0bc
--- /dev/null
+++ b/params_shard_196.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6fad67f53ee23d9f73e347f3e5b6340f198d72c2e2e1212f2f12f5b16396176e
+size 29360128
diff --git a/params_shard_197.bin b/params_shard_197.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2db9adc1daa5a6fea34ad5032813afd8e0bd81c2
--- /dev/null
+++ b/params_shard_197.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:870a4754dc31ad202066c69cd82ba494dca74ff3cdf4532a994d4cb318e9b061
+size 117440512
diff --git a/params_shard_198.bin b/params_shard_198.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e68093efd4741a223c001bed7c26e684d49b42e7
--- /dev/null
+++ b/params_shard_198.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:521aad352273d8d0ec45f0fb18df3b6ad3a0c8c9f27ad3151e0c821a4660f633
+size 24150016
diff --git a/params_shard_199.bin b/params_shard_199.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d47bc3c0c369ba626cfcc4d01faf4b3ffbc287a
--- /dev/null
+++ b/params_shard_199.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4b8b93705e2a438b02238e798af602e44c0b1ecd4a495de71bb4081216fe060e
+size 41943040
diff --git a/params_shard_2.bin b/params_shard_2.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b66a1f6d819cc683ee91a8255f0d25c177fb44ae
--- /dev/null
+++ b/params_shard_2.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8ea8f8403be27fc52261c49cd3e17246b3de0f388c1ce5db43fd69cd4ba47853
+size 41943040
diff --git a/params_shard_20.bin b/params_shard_20.bin
new file mode 100644
index 0000000000000000000000000000000000000000..96370ed90a3ade0b77bc93e9f584ef388686eb8b
--- /dev/null
+++ b/params_shard_20.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a3606eccacd31df8f31debdf03ee23828e343418c6c47475dad31b80d896dd6c
+size 33554432
diff --git a/params_shard_200.bin b/params_shard_200.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d0e0615bfa3debf4b8bfbd048eae7e3d77eb25f5
--- /dev/null
+++ b/params_shard_200.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e23580868591b50e0938afc92e1e4bdbf3086a2458a9755c1c2768c3285633a6
+size 33554432
diff --git a/params_shard_201.bin b/params_shard_201.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e26f3d9e62148a52385f2b2f1faf5f0f09675aca
--- /dev/null
+++ b/params_shard_201.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:657ad08161a9047e69a25fd588f8f58f0bb911fe60e925cd135117403f0efdba
+size 234881024
diff --git a/params_shard_202.bin b/params_shard_202.bin
new file mode 100644
index 0000000000000000000000000000000000000000..74282938028e694ba3712363b72c844a236a120e
--- /dev/null
+++ b/params_shard_202.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c6aa366d77d93f8a2f9b4391c277b63e7478127d392a5b27c0660d754374258
+size 29360128
diff --git a/params_shard_203.bin b/params_shard_203.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c1bea88f8c996bab529ebb51fb6fdc307aa233a3
--- /dev/null
+++ b/params_shard_203.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:95c67e4828023c7d09fd4c553d4847c2447b94054ab272c2c0473ce66b7a10f4
+size 117440512
diff --git a/params_shard_204.bin b/params_shard_204.bin
new file mode 100644
index 0000000000000000000000000000000000000000..265e61b339e3152e601dfb93763ada2b588dc5fd
--- /dev/null
+++ b/params_shard_204.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8262b3e33c7bf4a414c5883b9bc7d1c82e049902b51ed658955bcabe10531143
+size 24150016
diff --git a/params_shard_205.bin b/params_shard_205.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4dee2d98fa3718c5e4708a5971b76cffcbe218a2
--- /dev/null
+++ b/params_shard_205.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ed45a8641525b8de61d2dc04e9f3ce1a5c17cb3a011266773b50ad2e9109f9f5
+size 41943040
diff --git a/params_shard_206.bin b/params_shard_206.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8f5a0602f815c1ca1af84757a1496b40a945c0b8
--- /dev/null
+++ b/params_shard_206.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:957c7cfb6543bbde8e951b1d3b07393307fa20b5b83c69c175f8a703a3018d4a
+size 33554432
diff --git a/params_shard_207.bin b/params_shard_207.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5527c19944bcb688a2cb3cfff02399efd0ef5f62
--- /dev/null
+++ b/params_shard_207.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c82c79cd301e475a49b2613d29884fb28569e9209215071daf49f38c094cef37
+size 234881024
diff --git a/params_shard_208.bin b/params_shard_208.bin
new file mode 100644
index 0000000000000000000000000000000000000000..58bc7378f489c7e3f291ef2af1140e34dbdd5245
--- /dev/null
+++ b/params_shard_208.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e9cfb9c611091d66fddc50a133a13324e206872d73e228ba7d87e23a25aa7b6e
+size 29360128
diff --git a/params_shard_209.bin b/params_shard_209.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9d63f508580aedbca13920c6d509f40cc3c4ba5e
--- /dev/null
+++ b/params_shard_209.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:15ab76b8374bd3f22741572fb51c1800f5859c4beb1b0ba21e0c0ef7249b568a
+size 117440512
diff --git a/params_shard_21.bin b/params_shard_21.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2002c40f4419795e3f543d521b13c5ab75f4ffdb
--- /dev/null
+++ b/params_shard_21.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:055cdb31d01decb78bfe3893214d1d9968d52043d24504d08229db427c4ab43c
+size 234881024
diff --git a/params_shard_210.bin b/params_shard_210.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0ac279b9b5af91aaf36ed6a6d4adfbeb1ba7fe76
--- /dev/null
+++ b/params_shard_210.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c815351c2c9ac1e445f13a5bac39c9ad61f0e521d02551cf279ee93b0d74f436
+size 24150016
diff --git a/params_shard_211.bin b/params_shard_211.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4ca2f4b4302879c1506b8adb9e9bed537e2a2f21
--- /dev/null
+++ b/params_shard_211.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f346c80c1a0dea3871b7ad6e0d51003783e8140d61075444060c90a4ac97ac61
+size 41943040
diff --git a/params_shard_212.bin b/params_shard_212.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d91a9174ef4f8c0f8e2302b7298d134e8a5ce001
--- /dev/null
+++ b/params_shard_212.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f5e866f0c5418c29a006bc5d08a0f71ba3ab1d32e23d06cac41548d3dbedcea7
+size 33554432
diff --git a/params_shard_213.bin b/params_shard_213.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e268fce38eca1186861e432a5027be60323a65f2
--- /dev/null
+++ b/params_shard_213.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9960250ac9049fab090ee3a09dc7ba1fd0c7835d241f6f7c3e151b58af5fe359
+size 234881024
diff --git a/params_shard_214.bin b/params_shard_214.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c5ada2acf82b4c31e9a21edfd0d6c7450893ce9f
--- /dev/null
+++ b/params_shard_214.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:809e8198e51c4039043d236d98dc4235df0c907f94b19aea868b16cf11d95991
+size 29360128
diff --git a/params_shard_215.bin b/params_shard_215.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3e123caebf9615a24740db72cc5cc45c2168fe9b
--- /dev/null
+++ b/params_shard_215.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2a9d58138c209feb3fa58584f693db20d23ee7337f3b1ec2d6b06f816b8e27fe
+size 117440512
diff --git a/params_shard_216.bin b/params_shard_216.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7f7a290d6a93183159b88e47db4d4c0b78e6d4c1
--- /dev/null
+++ b/params_shard_216.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:326e373bc5e38c481425566e924a659bd555681a82b077dfaa2bf1b66ecaafc2
+size 24150016
diff --git a/params_shard_217.bin b/params_shard_217.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b29e433019a657095324197a0ce4c5ccf4721f9d
--- /dev/null
+++ b/params_shard_217.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b42bdb9e17ead1af9c32579659622854ca308b9e78da8c7f251b040ec6d46b0c
+size 41943040
diff --git a/params_shard_218.bin b/params_shard_218.bin
new file mode 100644
index 0000000000000000000000000000000000000000..918e8489c04a5dff4bcc088bc1b314e7cdca1e0d
--- /dev/null
+++ b/params_shard_218.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a9edafcd37c717c3d3beefacdd2ce7818950a7194fb5aa39877946f759130c4f
+size 33554432
diff --git a/params_shard_219.bin b/params_shard_219.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a246502bf784b8a43d86ecc0fb26ebb7a1fa3831
--- /dev/null
+++ b/params_shard_219.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4b7b73a6e4ae1c9423256ab8650f2887d98d1d9dc90fa0198b6902b9f8ae934f
+size 234881024
diff --git a/params_shard_22.bin b/params_shard_22.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9777ccd54f6cc73fbe0be69f61ab1672fee574f9
--- /dev/null
+++ b/params_shard_22.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:960a14f32637a76f552bbd2e18c4fe028d5745f7c68305ec0b7fe93ddd4d1cb2
+size 29360128
diff --git a/params_shard_220.bin b/params_shard_220.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cfacce0b1ef8057446106770ae9350c1aa362b2c
--- /dev/null
+++ b/params_shard_220.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:17f57dcdb6ea9d34e60e5e8a952d09cebd4186e4f6fed462a9e749155830977e
+size 29360128
diff --git a/params_shard_221.bin b/params_shard_221.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ebbf24df58d3c36edc4db606482562e2ac87f9e0
--- /dev/null
+++ b/params_shard_221.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b47bf7e49fd4aa76ef91a09108f1f2767dc2c05934956c5487001f3d2795cba6
+size 117440512
diff --git a/params_shard_222.bin b/params_shard_222.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3041db5cad8c83f2b9ad9b51099cf7beea7d4aa6
--- /dev/null
+++ b/params_shard_222.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0e6e4a34c3eeeeaa6986eacab2e46702fd8bd251b04b513ec0ed96ae2d42076e
+size 24150016
diff --git a/params_shard_223.bin b/params_shard_223.bin
new file mode 100644
index 0000000000000000000000000000000000000000..66a5c792a71cb9f674e0d85953ab78e0a59868ce
--- /dev/null
+++ b/params_shard_223.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:09a4660ba63e872ff8fcdea3ed68554c93615401b1a70d7b0d9ac94db17a43ed
+size 41943040
diff --git a/params_shard_224.bin b/params_shard_224.bin
new file mode 100644
index 0000000000000000000000000000000000000000..789d4629e4a05fd1ed13031e9ba2b12c5edbac4e
--- /dev/null
+++ b/params_shard_224.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6e8bf215a5856584d4f36966e73fc45bb87060ec38efaa7a1e7b3b80b1efa0c9
+size 33554432
diff --git a/params_shard_225.bin b/params_shard_225.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e892d7e61086f2bf0bd8c54de86d11e97c1b64a5
--- /dev/null
+++ b/params_shard_225.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bd53b0da664d96e552b72cf3474bf65b4cbb0eb191e066d0093125e0d71c5bf7
+size 234881024
diff --git a/params_shard_226.bin b/params_shard_226.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9969480871466f8b5aaccb215ec7f3bd7ce5be3f
--- /dev/null
+++ b/params_shard_226.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:966e9f6e9fdedf668ebb46b490afcd18e96a032f05f34022d774c0cef549b57b
+size 29360128
diff --git a/params_shard_227.bin b/params_shard_227.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b812096a8fa63a7a62f4ea9f2fcaad84c468cc4d
--- /dev/null
+++ b/params_shard_227.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:641303f20d022b08d9fda92e661f467566b1c41e35a7983b053ffe5e72c0e2d7
+size 117440512
diff --git a/params_shard_228.bin b/params_shard_228.bin
new file mode 100644
index 0000000000000000000000000000000000000000..da5856a496dc639ab7665c71d29ea3b164027732
--- /dev/null
+++ b/params_shard_228.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6404f732dbcd9f6f9251de6fa2e6a75b252ec3fd63b082f82fc9b60f99b5a93
+size 24150016
diff --git a/params_shard_229.bin b/params_shard_229.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f94e8a5daea421edf67cec915054eab4caf10779
--- /dev/null
+++ b/params_shard_229.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:66ba0742a3426b8d2259c832078d45a7fae6eb79993060b8473e834e4c7d3a60
+size 41943040
diff --git a/params_shard_23.bin b/params_shard_23.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5e538db3c95dc2ffdf5500c300bbdb1bbda43b3d
--- /dev/null
+++ b/params_shard_23.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a4746e8324386c0cf8146ab318f8f0a79a0820daec5f5baf4d545e5330a1b29d
+size 117440512
diff --git a/params_shard_230.bin b/params_shard_230.bin
new file mode 100644
index 0000000000000000000000000000000000000000..376f0355d56d306be9a90728180b5447295bd28e
--- /dev/null
+++ b/params_shard_230.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ec2701e62e09b9edfdc8dbdc174b0823b62bf95f9a9155b3834b57df694095b1
+size 33554432
diff --git a/params_shard_231.bin b/params_shard_231.bin
new file mode 100644
index 0000000000000000000000000000000000000000..64b547e49d6cb0f9d8e8276f47ad1aa2d23ed056
--- /dev/null
+++ b/params_shard_231.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5b47f74baec623a277386bf5ad89b5be8d58d03c28f760cf7d697c766b09856d
+size 234881024
diff --git a/params_shard_232.bin b/params_shard_232.bin
new file mode 100644
index 0000000000000000000000000000000000000000..92c76cba6f1d05a76bd284ecb40ae19f08bad391
--- /dev/null
+++ b/params_shard_232.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:809462a6bece44f06b9e93d79c1ba8349f4b3b917c50be227618b742bd893488
+size 29360128
diff --git a/params_shard_233.bin b/params_shard_233.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3c7fa77021ee13ce719addc6a1a0330de4f4cdf7
--- /dev/null
+++ b/params_shard_233.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c5ca28114756b5bb9282d270ff37b800e90bf267d616f0fc24226f38439b11e4
+size 117440512
diff --git a/params_shard_234.bin b/params_shard_234.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dd1bd44199b7e77e7b3c5b922607f67352f70f1a
--- /dev/null
+++ b/params_shard_234.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0ddf84167f0f9e12b00f845a2a096263da5274689e96b4cf5e886c4e2c3e9f71
+size 24150016
diff --git a/params_shard_235.bin b/params_shard_235.bin
new file mode 100644
index 0000000000000000000000000000000000000000..588e519cfe78070c93e1b15e7b83d0fc9b794a3b
--- /dev/null
+++ b/params_shard_235.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e1476c83eda133b7a9437063efc3af382f54bced18fbc0af0275efa40de325c4
+size 41943040
diff --git a/params_shard_236.bin b/params_shard_236.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7caa3de3e4528eeebca1dd8a2e2f3714b9a6d115
--- /dev/null
+++ b/params_shard_236.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:76c71158d9a6c37b145b9d0b94073f594642b4f8fc4ea0d3630354f07bc9e9b3
+size 33554432
diff --git a/params_shard_237.bin b/params_shard_237.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b7a55700123cab6cad5be0bb63f748bf95f0c1c4
--- /dev/null
+++ b/params_shard_237.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a8983fc9f8943d0ec7550a4ce4214f56e8547f28aa1166763d15625836403a90
+size 234881024
diff --git a/params_shard_238.bin b/params_shard_238.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9cb2ddf6995cc559a680fdbcf502c053f54cedd8
--- /dev/null
+++ b/params_shard_238.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:edc58bfc46e6a2770f00da94687819b11d9af888f621461fe287d759ba00adc9
+size 29360128
diff --git a/params_shard_239.bin b/params_shard_239.bin
new file mode 100644
index 0000000000000000000000000000000000000000..09a058748126ac3a048c79c8a28fb7592f097c76
--- /dev/null
+++ b/params_shard_239.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c43e2ed68a43023fbe6274d03c5e68c4e48d18d62160b3acbbec1a1a6414a558
+size 117440512
diff --git a/params_shard_24.bin b/params_shard_24.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a07f2fb72a3dfdba3b46ae3650b6e7477a07a6c3
--- /dev/null
+++ b/params_shard_24.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:046ae189e9d6b1acedac9edaffbf993534bb1f13b0cee74f29f1e8288b55cf12
+size 24150016
diff --git a/params_shard_240.bin b/params_shard_240.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dbf44a59e04894c3aa771b56db1a19ad0e137fc9
--- /dev/null
+++ b/params_shard_240.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:51704e42a300641debe2aebf1a2402f62cc90ac1c606ae372e98579521e9b890
+size 24150016
diff --git a/params_shard_241.bin b/params_shard_241.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9efabc1ca8d764b3caa95ad1b7be2838fe26342a
--- /dev/null
+++ b/params_shard_241.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e44eb524f9b50881757847886eea56bebb7a836e2d37f5054c8240d4d376b080
+size 41943040
diff --git a/params_shard_242.bin b/params_shard_242.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aac202529efea2391f23ae3537df257d0b4186bf
--- /dev/null
+++ b/params_shard_242.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3326c1cdc718c6aab568c1da6650b7f1209f060dfe7685c65e560e19d3477b65
+size 33554432
diff --git a/params_shard_243.bin b/params_shard_243.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6d793fcdc59a3bf0c5b502fae38d2929ddefd115
--- /dev/null
+++ b/params_shard_243.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e7a933091051c1c41bbfcf6d76a3389592cd76e0ab9c18e12a91358c5edd56da
+size 234881024
diff --git a/params_shard_244.bin b/params_shard_244.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f61ebfac9f3bc0974590161fb74d6e5c7de05dc0
--- /dev/null
+++ b/params_shard_244.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb5f04aa4decb9c0b1afc4fac7be26f6e596dca61cf8bce246df32cf3d7da801
+size 29360128
diff --git a/params_shard_245.bin b/params_shard_245.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1719f5ec2176f62cc634ef61114dc747d58bf642
--- /dev/null
+++ b/params_shard_245.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f5560beee1a325d361976296ddafef4db904b7ce213dbf83504b803056368b38
+size 117440512
diff --git a/params_shard_246.bin b/params_shard_246.bin
new file mode 100644
index 0000000000000000000000000000000000000000..442afc340a406f82121c1da3d67c54649b66a176
--- /dev/null
+++ b/params_shard_246.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5720abe60e6f4abbdf58a4580dced77eefe5baf124652dc30134dffeabfe4d76
+size 24150016
diff --git a/params_shard_247.bin b/params_shard_247.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ec02f4b47c05cb76654dcf6a3b160cce29f70d1e
--- /dev/null
+++ b/params_shard_247.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:830dfd7a9b13940076dfc0143b5555add858ffa31be300fc15662a4331b2d03b
+size 41943040
diff --git a/params_shard_248.bin b/params_shard_248.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0735c18b4dfb3c7b6eabddf19fb54006dd4ce89c
--- /dev/null
+++ b/params_shard_248.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bcbc1e78db69ead77dbbb1038b602908f9a8a91a4c6adf2ebc26980f2dcdbddf
+size 33554432
diff --git a/params_shard_249.bin b/params_shard_249.bin
new file mode 100644
index 0000000000000000000000000000000000000000..833413d13ee00c049cafb8856e7c1d08a99831ac
--- /dev/null
+++ b/params_shard_249.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:afa995d2abb42b6da0dbfa9cbb0a8c58a2da084305fee1aacfe82b13c1f3d520
+size 234881024
diff --git a/params_shard_25.bin b/params_shard_25.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5ba2eeaeef1f87e6439cce53cc98bad72fa12d7b
--- /dev/null
+++ b/params_shard_25.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:21bd6c41078eb6939b227e04aba8439ed9c0066b093b03840fd71dda3412a899
+size 41943040
diff --git a/params_shard_250.bin b/params_shard_250.bin
new file mode 100644
index 0000000000000000000000000000000000000000..849a8b4d9f324b57850c3ddbc3220043911dbd1d
--- /dev/null
+++ b/params_shard_250.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ec0a013d3e694e21d89eb9dc15e3ff1580a98b56ba7308781a7d6320858cc77b
+size 29360128
diff --git a/params_shard_251.bin b/params_shard_251.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5ad66e8d94d4d91ba61629c0de7c13494a382e43
--- /dev/null
+++ b/params_shard_251.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f1bf7e79188df33ddfc302f1e392d8d430f358b7d4607d7336e092beaddcb852
+size 117440512
diff --git a/params_shard_252.bin b/params_shard_252.bin
new file mode 100644
index 0000000000000000000000000000000000000000..924329f5a42b4e97d86dcc6eeac2ea4964f04390
--- /dev/null
+++ b/params_shard_252.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0a2933e0249dcc53e9830ab6db79707e6f1bf3fa266e124cfb3b92915202eb05
+size 24150016
diff --git a/params_shard_253.bin b/params_shard_253.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5b6cb0776b285fc51a31d807f16199a549978e99
--- /dev/null
+++ b/params_shard_253.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:007e9e958b0a0a4163b55bb87ee77a191444fdf7e4e4e4e2dab59a4e0b71d67c
+size 41943040
diff --git a/params_shard_254.bin b/params_shard_254.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6c2d2b1e941500f1da0c0cb7987f5250f7d33dde
--- /dev/null
+++ b/params_shard_254.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dd7dcfd435710bfc07ef229c52a48a2ea4bae7fced870ab4d32c5f43b9b7dfc5
+size 33554432
diff --git a/params_shard_255.bin b/params_shard_255.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5eced983f772eb71ebb6f58e3a1c62524dc44fa5
--- /dev/null
+++ b/params_shard_255.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1ad822d0e03382607d784d13b796636d4da53d7e14cebdfa94aff94c3568c187
+size 234881024
diff --git a/params_shard_256.bin b/params_shard_256.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cd1723e459ed2c01dbbdd580ee6a61f76fb3abf8
--- /dev/null
+++ b/params_shard_256.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da108c697c6bae927485dd1f4ef2a5e2ed76eb759ee3f52d4497ef0281b279d1
+size 29360128
diff --git a/params_shard_257.bin b/params_shard_257.bin
new file mode 100644
index 0000000000000000000000000000000000000000..31c7aca5b85f3317e4b48a73f6bd64c00e773345
--- /dev/null
+++ b/params_shard_257.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:18e3a75478b73c17d8dcd77d7426d62b47b830383ebc99d41ad602bf62e631c2
+size 117440512
diff --git a/params_shard_258.bin b/params_shard_258.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f139bf4bc938822062d8eb280738d3ef719bf422
--- /dev/null
+++ b/params_shard_258.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:024d0e606925b0a2e59f61ea3e1751d3e6e613c5fc58022725dbec30767cf7a5
+size 24150016
diff --git a/params_shard_259.bin b/params_shard_259.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9729a8c161b78de66e34634412be1c51cc501bf6
--- /dev/null
+++ b/params_shard_259.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a570a360709de389ce890ea6a89749a3ef0308fd9665ac54615c7521e3df0506
+size 41943040
diff --git a/params_shard_26.bin b/params_shard_26.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d6bb04c2646fae7a23616f0736b442b9c3761114
--- /dev/null
+++ b/params_shard_26.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:83a2446b5ae8997b8016fd0f39ea3fa14bbf58365f1fafc042522cace116a8ab
+size 33554432
diff --git a/params_shard_260.bin b/params_shard_260.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c052da6378a4c1ad6144c3d20029614cee29e149
--- /dev/null
+++ b/params_shard_260.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:576d8d94a375031770a9f191c05e6523f339eda30c6655d5bbcbb4c691476036
+size 33554432
diff --git a/params_shard_261.bin b/params_shard_261.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa29c62362b10cd8e697b9dc7a8c276e536fcfac
--- /dev/null
+++ b/params_shard_261.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:73027faf52ae926b3a967d7fd734b94ba419bef47a0d09661061d645af46d49e
+size 234881024
diff --git a/params_shard_262.bin b/params_shard_262.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2edb0fdad79bcafafa072b1be9568159e45bbfc9
--- /dev/null
+++ b/params_shard_262.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:edcf07bba8751b80bac47f88205a84ab68a9c8f3bd75b6692a1f5e2dd33f30cf
+size 29360128
diff --git a/params_shard_263.bin b/params_shard_263.bin
new file mode 100644
index 0000000000000000000000000000000000000000..838d03d007a9b1e7546304f7c07ee73a29df6c17
--- /dev/null
+++ b/params_shard_263.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d4c1365328ca110680367e8c077bfd13ef0c4d304a6d2d2172d903cae87a7ba
+size 117440512
diff --git a/params_shard_264.bin b/params_shard_264.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2c3e465a197208228dfedb2565b24a2abe457545
--- /dev/null
+++ b/params_shard_264.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e41ec8dad7dbfcc3b19e2b729f4b8764f9823e8cdc7a351bd6c3d7a86312dc11
+size 24150016
diff --git a/params_shard_265.bin b/params_shard_265.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dcdf0f0a28540f5ef600b820d6b62973a76904bb
--- /dev/null
+++ b/params_shard_265.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:43a49cf8274001ea3db2c59c1f969c0d400fdde142b31e18c7d5dd0220c51298
+size 41943040
diff --git a/params_shard_266.bin b/params_shard_266.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4f47c139ff2ad03a8d571fd0890cc3ee1bb11062
--- /dev/null
+++ b/params_shard_266.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a878b27343c7aa1af0c4f028aa0bb87220dddb60c743db4abfdbcd55150a4d45
+size 33554432
diff --git a/params_shard_267.bin b/params_shard_267.bin
new file mode 100644
index 0000000000000000000000000000000000000000..44d5f95d3a3642476297304b7f46885ec7defb98
--- /dev/null
+++ b/params_shard_267.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3532d5da5f4f214fed684bed53db24ecc9f85dbec7823d31c3ed071b4a707e05
+size 234881024
diff --git a/params_shard_268.bin b/params_shard_268.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7ce12fa95f5d83f9450426e0be4d7d7d3623b50e
--- /dev/null
+++ b/params_shard_268.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c517215da8636e7dd2914e4188c747ec9a14db48c30f31dde3b469a78e3697bc
+size 29360128
diff --git a/params_shard_269.bin b/params_shard_269.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b6cd2d581b9593e69fbe83545765dd728fcbb496
--- /dev/null
+++ b/params_shard_269.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:050f3f144dcd2c6a58d09c7de5d10840e5a6a66fabd85c3f7ab2bcec445ceb75
+size 117440512
diff --git a/params_shard_27.bin b/params_shard_27.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d8bbf62ace0dfb6e7275a8743bac5a4d88bb9d94
--- /dev/null
+++ b/params_shard_27.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:03c0be25c6dc3c548f4652b7ed40ba77cf189c70be847dce1ed460d836739bf6
+size 234881024
diff --git a/params_shard_270.bin b/params_shard_270.bin
new file mode 100644
index 0000000000000000000000000000000000000000..056ff13f8ceb91431540372ec08ad02f1bdcda21
--- /dev/null
+++ b/params_shard_270.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6dc3def229a7db53a169a576e5d5bc8c2fdaba9b48d89ddf9ae5624fbbd0f546
+size 24150016
diff --git a/params_shard_271.bin b/params_shard_271.bin
new file mode 100644
index 0000000000000000000000000000000000000000..08a6a373d80e78530470d216311b95c0adb7c1fd
--- /dev/null
+++ b/params_shard_271.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:56cb77bef5fa0af19ea1ea4c533206db77cc82aca8e65f33119cf5ed90125af0
+size 41943040
diff --git a/params_shard_272.bin b/params_shard_272.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1128d098beac8291440ea492a751d4050c38a7d5
--- /dev/null
+++ b/params_shard_272.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3e6a5ee86c2de9241934a379176dbad53760e875c630def831a5e60ec2bfd377
+size 33554432
diff --git a/params_shard_273.bin b/params_shard_273.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1fc3f765e10c9fa82329caed9bd752955f7920f4
--- /dev/null
+++ b/params_shard_273.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6e1a3a4274f897cc3d0f3265a04c6c8249387495cbf1f127118f8529cd92ca61
+size 234881024
diff --git a/params_shard_274.bin b/params_shard_274.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a27a83d260fa3436928e6efcb923c53860fa1952
--- /dev/null
+++ b/params_shard_274.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:948ac9f03a33e06de5b86e4055cc8e1414e4437c13183933907fb064d472511b
+size 29360128
diff --git a/params_shard_275.bin b/params_shard_275.bin
new file mode 100644
index 0000000000000000000000000000000000000000..42c40b4292ca20e67cd55c2a244d8a57b5f7be4e
--- /dev/null
+++ b/params_shard_275.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:623795db8bbae734749c09e278510c18efab9d31b2f4d7250ef65be3b1a5a99a
+size 117440512
diff --git a/params_shard_276.bin b/params_shard_276.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e4e23fdde83b3e896b3edd800e059875cfc49033
--- /dev/null
+++ b/params_shard_276.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:16132142e550650705ef6e223dc56a4a5a8cafc3d0e3430a660bf796cc87d1c4
+size 24150016
diff --git a/params_shard_277.bin b/params_shard_277.bin
new file mode 100644
index 0000000000000000000000000000000000000000..364043fb69617135c8e14e658dedaa70bfcb59d8
--- /dev/null
+++ b/params_shard_277.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b1a5f5d2edc3bdbca07a84a2be0f43d6952c69bf17a6e3480d07cd900372bfec
+size 41943040
diff --git a/params_shard_278.bin b/params_shard_278.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0eb89ec0b60b4814774b963dc06af1f2d62799cb
--- /dev/null
+++ b/params_shard_278.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be25fc5b96421b8a624cc8d79a766e945359a04cfe529e9860fc36543161176b
+size 33554432
diff --git a/params_shard_279.bin b/params_shard_279.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2cd056554e6424e38e71fec22e5a506d8ae60855
--- /dev/null
+++ b/params_shard_279.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3031c803f855e4a1d0949ac277cc3fcdb1a08fe26f157436e6ed904ec9994f48
+size 234881024
diff --git a/params_shard_28.bin b/params_shard_28.bin
new file mode 100644
index 0000000000000000000000000000000000000000..69f2cab909323d4448f185b6fa1b29b60bbf6291
--- /dev/null
+++ b/params_shard_28.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9dff85688cc5cc079894516eec44595b4105891edf6e542b36406594c1951dcb
+size 29360128
diff --git a/params_shard_280.bin b/params_shard_280.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6e2992fa627926596e719efdd6a2b46534377f8d
--- /dev/null
+++ b/params_shard_280.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0a150483cf444d480630dbd97b5726635ac7667518573e90a99195067c90742c
+size 29360128
diff --git a/params_shard_281.bin b/params_shard_281.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fc9d40b8c6452edcb70ee19f23847768ba4df3cc
--- /dev/null
+++ b/params_shard_281.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3c27a509dfbd89b9a71ac8a92a49bb703d9d7ad14764bb2960df570f9bdb38a3
+size 117440512
diff --git a/params_shard_282.bin b/params_shard_282.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c8e0ea3dac50a68c07cf407200a27b98829249c5
--- /dev/null
+++ b/params_shard_282.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a68701572518a09c4b8a4f28415617ede0f40c58a0b9cf34384dff085062f20e
+size 24150016
diff --git a/params_shard_283.bin b/params_shard_283.bin
new file mode 100644
index 0000000000000000000000000000000000000000..70e5c7df39882425b1dfb08e6e4a5c3e89016f27
--- /dev/null
+++ b/params_shard_283.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:103b6f56978d1cca85985c17bab796578666a6c5ddc43160d76cafb994370961
+size 41943040
diff --git a/params_shard_284.bin b/params_shard_284.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e4d0f0ad89c07240d12cb3271e3fe1f0e5f5e1eb
--- /dev/null
+++ b/params_shard_284.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3916adb2171c8f7e17a70255536ba541a528db83ac7f5ee9a1d1dc46e73f281a
+size 33554432
diff --git a/params_shard_285.bin b/params_shard_285.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b781d9e266b4113dfaefdd1d8c8de6c5b575ac8e
--- /dev/null
+++ b/params_shard_285.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:416fed051a6a1266acc9fe7755ca306b5eaa706babb9a57f68dd8c9faf88dccd
+size 234881024
diff --git a/params_shard_286.bin b/params_shard_286.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a4b7f2eb11cea4a3d163bdad11b3f87b6645a734
--- /dev/null
+++ b/params_shard_286.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:753db0d821faf10f728655025c0e84f03b63884cc3c7cb1cfb3b9b56e5cba8ab
+size 29360128
diff --git a/params_shard_287.bin b/params_shard_287.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b53de0928bf94feec0e85b107c3a048225ffab60
--- /dev/null
+++ b/params_shard_287.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3fe06d8862ca169a722311b938738591bc321d541eda11e404c154f720ddfd4
+size 117440512
diff --git a/params_shard_288.bin b/params_shard_288.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7fd888d8c3e613bce4a1233e97d5efb1a6d3fd81
--- /dev/null
+++ b/params_shard_288.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eaca6ded4ae4fe9088621b25f8c63d177950ad522fa54122ecb3a00f1371c104
+size 24150016
diff --git a/params_shard_289.bin b/params_shard_289.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2eaea82125b3ec5bf50db245636d83c017b39412
--- /dev/null
+++ b/params_shard_289.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6677dc67b60ce2922dbffe5c85bde4529725baa8b6c3dbccabb33348c110aef4
+size 41943040
diff --git a/params_shard_29.bin b/params_shard_29.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ed4ad41173f443baf51b1836743b695cb3c6f14a
--- /dev/null
+++ b/params_shard_29.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:58bda659d1467346bf680957bd9788208f0e0e30326acb3315695807c07177e1
+size 117440512
diff --git a/params_shard_290.bin b/params_shard_290.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e338f2e9e0b1675bf7d41ddb433398cf1101485b
--- /dev/null
+++ b/params_shard_290.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ccb290fdebdad360e5922909a32ea630cd95976769fa5a7d1e813c06ec144013
+size 33554432
diff --git a/params_shard_291.bin b/params_shard_291.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bf9b5706271550c5c438cfeb4c4966c16a44949e
--- /dev/null
+++ b/params_shard_291.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:40bb281eefc9a8ad5b7c8618af4813a2dee1edcaa0a9941a499b9f9c63ba30d2
+size 234881024
diff --git a/params_shard_292.bin b/params_shard_292.bin
new file mode 100644
index 0000000000000000000000000000000000000000..07414d5744a67055759e4d07f4df93c1ea54f72f
--- /dev/null
+++ b/params_shard_292.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f528cfba8047ae2e2d0259477e6a874c9d139ce06426de3fecc81712df82bb18
+size 29360128
diff --git a/params_shard_293.bin b/params_shard_293.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a51d313f2d3cebde4ce5560e68110d60d4986391
--- /dev/null
+++ b/params_shard_293.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:17e0dc614e16995a91c922f270587a6ff8c5ccaf1698a3ff9338b38ae7268095
+size 117440512
diff --git a/params_shard_294.bin b/params_shard_294.bin
new file mode 100644
index 0000000000000000000000000000000000000000..374bc4d7254eaf46e4080ef6fc4d3d198ea3f564
--- /dev/null
+++ b/params_shard_294.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7363f2b8a5147bfc104d478dda949b6a0ec4258c3830502b192cbed85447d636
+size 24150016
diff --git a/params_shard_295.bin b/params_shard_295.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8ad1f084e98b58c09695f56261f3cfaaf8db3ae5
--- /dev/null
+++ b/params_shard_295.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d8dbbb8b238f2e6ac8b2e14b788a2f1ae252d4711fa1c651d3e6c8753c0a9190
+size 41943040
diff --git a/params_shard_296.bin b/params_shard_296.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e3017c21818a8e1c92bf253165a3e0e0269cac38
--- /dev/null
+++ b/params_shard_296.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0001bf9233ac40ab69638d651e537345d0e5b996064dd8936e4efc382f36f495
+size 33554432
diff --git a/params_shard_297.bin b/params_shard_297.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3389cfe5aac730637c9f960ef3dae4978abad76c
--- /dev/null
+++ b/params_shard_297.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f12ab4054025ceea6a813841ed87973d8421fea5593f46e388b98e0e10b6365d
+size 234881024
diff --git a/params_shard_298.bin b/params_shard_298.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ff5c29a9695186728a21d15f2e88fb24f02c216c
--- /dev/null
+++ b/params_shard_298.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:331e24ac4e609003a78d833e9bcf43d4c87288fba2bc627df912da3e46e6bb2d
+size 29360128
diff --git a/params_shard_299.bin b/params_shard_299.bin
new file mode 100644
index 0000000000000000000000000000000000000000..68d06a0a075435e21fa3038e8f50e085806f352f
--- /dev/null
+++ b/params_shard_299.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ef1d5ea5fe0cdfd9f43a89ebcfbdd158e736cf81a9ad11de13fea78e10fc978e
+size 117440512
diff --git a/params_shard_3.bin b/params_shard_3.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b01cb16ad7344a45fb5eaf087de7aad4f344c585
--- /dev/null
+++ b/params_shard_3.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6510ae77ca673bb2b9ebc48e7b11a3a73cf75861bf84c681fa47f45a5d07ebcd
+size 33554432
diff --git a/params_shard_30.bin b/params_shard_30.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7bed6b0097de72eee6e3015f82b21c2e3b0591af
--- /dev/null
+++ b/params_shard_30.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e87b321f2f852dd2918fbfb81b82dd2cfdc9c8a32437f455645272be7bf8db1d
+size 24150016
diff --git a/params_shard_300.bin b/params_shard_300.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7621d5fb4f0de7f18a29c2a144c77bbf154325b8
--- /dev/null
+++ b/params_shard_300.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1fa2c0286593828826b3603d90ce9df317aac83b8478d864d80ea16b4c64b2fd
+size 24150016
diff --git a/params_shard_301.bin b/params_shard_301.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a54391951929c55ba84eea264d96be5d0c7902d3
--- /dev/null
+++ b/params_shard_301.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c6d3c38d0f72dbc5ff9cda533c7d33c5833ca967cf4e600b3cc36923d69c64b
+size 41943040
diff --git a/params_shard_302.bin b/params_shard_302.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d6a21131804cdd3f3ddf502f36acb8ac9d4dd65
--- /dev/null
+++ b/params_shard_302.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7e05072fc961f6bf866dd2f33917832c864601f2ef18325ff367befc7cd98f24
+size 33554432
diff --git a/params_shard_303.bin b/params_shard_303.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bc036a1a44b045b2172e75a199a4023c80616876
--- /dev/null
+++ b/params_shard_303.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0c2f4951b1f1380548208a3be18c0ec20403314a12088e1ba64a1947d4eb5f59
+size 234881024
diff --git a/params_shard_304.bin b/params_shard_304.bin
new file mode 100644
index 0000000000000000000000000000000000000000..79c478f38eca61a6e1d1efaccf414bd432a9c7b7
--- /dev/null
+++ b/params_shard_304.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c3d4a192f849a535865ecfbcfd35ed1e40373cdf885ebec432e96037f17b0109
+size 29360128
diff --git a/params_shard_305.bin b/params_shard_305.bin
new file mode 100644
index 0000000000000000000000000000000000000000..108dc4b2c72eca3d9d843906dbef6fba4d5e0d45
--- /dev/null
+++ b/params_shard_305.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf568a5f955b551647af18c5c1becd5f33d34ff4699646e7b6d1c4d83793cc04
+size 117440512
diff --git a/params_shard_306.bin b/params_shard_306.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8c6678feb60f73841b3d6c9e07eb4ca525056496
--- /dev/null
+++ b/params_shard_306.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:181a1ccebecbd040ec22e37ddf6bfa54914d613a2a2664cfdbdd0952904318f7
+size 24150016
diff --git a/params_shard_307.bin b/params_shard_307.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d0330a01db8b4e6ea2869d1175fd0911974d9a7f
--- /dev/null
+++ b/params_shard_307.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6c6fd8960a4dd9eca3a4c66021e45736a73f33dc136e45c0ef1370ce5a403603
+size 41943040
diff --git a/params_shard_308.bin b/params_shard_308.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5e590b0e0176e3cce7b437fe2846bde17e2c35b6
--- /dev/null
+++ b/params_shard_308.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:00b9a843f9532816ccae53725a2d2578f667c23ddd40171dc3c4e40982a0370c
+size 33554432
diff --git a/params_shard_309.bin b/params_shard_309.bin
new file mode 100644
index 0000000000000000000000000000000000000000..11bb291a71a6c1954ce5da29076003c4dad68e9c
--- /dev/null
+++ b/params_shard_309.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8058a71ae24c5e54bf2317f912bcd318b960257ee247024bde407a46e08f060f
+size 234881024
diff --git a/params_shard_31.bin b/params_shard_31.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a2a7558cd8a10164b16f13b2d75ab343f2986192
--- /dev/null
+++ b/params_shard_31.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:37a77be0dfc49039ebdf83e596e1e375c9b339b5fdae41aaf25cd7406f9af3b6
+size 41943040
diff --git a/params_shard_310.bin b/params_shard_310.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f8a56c35e60eacad25ceac97692fbe08be118c70
--- /dev/null
+++ b/params_shard_310.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:84d3c372a92b400f3c1ebc129f36daf6ea5ef6a2e2499e9692d3b4fdd35714b8
+size 29360128
diff --git a/params_shard_311.bin b/params_shard_311.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9d230e633e285ae47ed3dfe90fcabebf8a8b912b
--- /dev/null
+++ b/params_shard_311.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cab82f08f58a130262d73626859b1f61dce347ed814dbb530b4d1931e77bf721
+size 117440512
diff --git a/params_shard_312.bin b/params_shard_312.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f4a832e958c3355d4a2cc8ad39887bcf6fa9bb1b
--- /dev/null
+++ b/params_shard_312.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9371d6b84601118ed71abd660b980a4350cf235ae9e5ec8eab77072f2ad1cc29
+size 24150016
diff --git a/params_shard_313.bin b/params_shard_313.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f7466f9e9d3eba048e18b4f2a7c884ae8166f723
--- /dev/null
+++ b/params_shard_313.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:81c44aee0a169444cac12e2a5f5b4a70d1c50992ad8faab0e2159d527fb5c1bc
+size 41943040
diff --git a/params_shard_314.bin b/params_shard_314.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3e24092f387164f2767702a848206701e5a59986
--- /dev/null
+++ b/params_shard_314.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eb0c223e6cd428a1d1b4fa2d283d021c42974f6400e763622820210ef1b71055
+size 33554432
diff --git a/params_shard_315.bin b/params_shard_315.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c6646ac24b05e3a81163b4e6b4601b2e87b0cac2
--- /dev/null
+++ b/params_shard_315.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:48d160a5b55efeecc3ca7f6ccf79a5ccb5219fa94773378fc46ed9773b0fa066
+size 234881024
diff --git a/params_shard_316.bin b/params_shard_316.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e0fb3c639ab1419807d145d17ae24a75ecef893a
--- /dev/null
+++ b/params_shard_316.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fd38f0c1ef7fb3c762fb10d21d876dc582bbeb1536eb5e6d591a8efc899826c2
+size 29360128
diff --git a/params_shard_317.bin b/params_shard_317.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f5c55d4ff1a259a84dcf0447336bc028aa0627cd
--- /dev/null
+++ b/params_shard_317.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:680b807f9b1b511b305ca64fc65c6e5e2ce9ca03e48d7858732475e3d5b06f4f
+size 117440512
diff --git a/params_shard_318.bin b/params_shard_318.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6693e202d15d512aa8990d2b35f5aba39e57e09f
--- /dev/null
+++ b/params_shard_318.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:46111e2fa7d3f39b97d9200f80bbd2c9d072fe9f5c5066876fe4bf1407480976
+size 24150016
diff --git a/params_shard_319.bin b/params_shard_319.bin
new file mode 100644
index 0000000000000000000000000000000000000000..faa43a3da16c6142506609ee463c75fb0c855045
--- /dev/null
+++ b/params_shard_319.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f6e21f43593d5db64b68b729176a0fbc1870ec21a2e3ef22c1360f74b4f10fb1
+size 41943040
diff --git a/params_shard_32.bin b/params_shard_32.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cf74503edf040b8f2b6ae4775c1d2374bc77b912
--- /dev/null
+++ b/params_shard_32.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:292031444f9f5d57133d572869b0c31cec363376d2d58d3deceeca58a5450d99
+size 33554432
diff --git a/params_shard_320.bin b/params_shard_320.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d3dc6b9ad04dddae16103ba5eec50412a2be98b
--- /dev/null
+++ b/params_shard_320.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3ea18a0fab9df4631fe00fde3c5eb9d7077a2548742d225d30d44594e76bbcd8
+size 33554432
diff --git a/params_shard_321.bin b/params_shard_321.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2271148f9690ac7601e093f7598a735ccbe14ffe
--- /dev/null
+++ b/params_shard_321.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1905d63f63dfba30254c9f6f0c3769cbfdca4a04dd178e1d9ac984ebe18ae984
+size 234881024
diff --git a/params_shard_322.bin b/params_shard_322.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7eec559996f07b64f52b5fee8948bf161d712d89
--- /dev/null
+++ b/params_shard_322.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c2beb7108439ac9305bed9c2648947457422ad50ca9976eebbac0766a301b5a0
+size 29360128
diff --git a/params_shard_323.bin b/params_shard_323.bin
new file mode 100644
index 0000000000000000000000000000000000000000..941f19af06eb3240eb9f745a7cbde3d196bcb5f7
--- /dev/null
+++ b/params_shard_323.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fd858e49939f2b3ae1646090d5278d0b45714943d38256a3c4d32e26551f15e0
+size 117440512
diff --git a/params_shard_324.bin b/params_shard_324.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8040973025ae87898cc181b4d5edb860410211d1
--- /dev/null
+++ b/params_shard_324.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0eece4945ee47de59ae81e4f7eaf78f349f259999a62d45327f638f98421f8d4
+size 24150016
diff --git a/params_shard_325.bin b/params_shard_325.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4dc47cbbca6d94e1a745b7f029f3544ad29658ff
--- /dev/null
+++ b/params_shard_325.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f6baaeacaf8242ec25823e59ab162cdad8556800f3c1e954066436c6a3f67738
+size 41943040
diff --git a/params_shard_326.bin b/params_shard_326.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6a2d3ad6ab89b9df3a7982806a4e660d0c431c19
--- /dev/null
+++ b/params_shard_326.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c3d7f367753c6b72e5522993ae56d368842e01aff05ba99701b8d24cb74ed5b6
+size 33554432
diff --git a/params_shard_327.bin b/params_shard_327.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9975a1ae63fcb1d5a8ea3c1b6175e73ce2cb6931
--- /dev/null
+++ b/params_shard_327.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:27f41a50e74eb957930b04ab7d67cb4431ebe26469e8d26881c3cbfe0c2ae6e8
+size 234881024
diff --git a/params_shard_328.bin b/params_shard_328.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9beabc5d9e5483fc46e93c6d685dc180191267cb
--- /dev/null
+++ b/params_shard_328.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:07f7fec246ee76856b19de45dbe7e649466871eb7c7b91f08e1c415d371d5850
+size 29360128
diff --git a/params_shard_329.bin b/params_shard_329.bin
new file mode 100644
index 0000000000000000000000000000000000000000..41642b63911fd4fa6e90f5e8ae68b7c0ed654a5b
--- /dev/null
+++ b/params_shard_329.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bf871e16740c6e72c065c5ab63bcfcf5b503d91c83e778f90e91a66dcc7205c8
+size 117440512
diff --git a/params_shard_33.bin b/params_shard_33.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2e7ac95745d58245f2ac1b04665c14c3a75a5246
--- /dev/null
+++ b/params_shard_33.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b69330470aad1b8a4492b09e0a15973b87128f3c680b61fca9a3aec588cc3b84
+size 234881024
diff --git a/params_shard_330.bin b/params_shard_330.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1d434007828fa82b106720bd179c0de31e359570
--- /dev/null
+++ b/params_shard_330.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bf474e835a68dfe03a63034441747e7e15c672e751e21cef43e7f0cf1990cb97
+size 24150016
diff --git a/params_shard_331.bin b/params_shard_331.bin
new file mode 100644
index 0000000000000000000000000000000000000000..33372b0bff12c1998358e248a470217367fbfb10
--- /dev/null
+++ b/params_shard_331.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c35940b90ad9000b098d7d5e2d545a08dcd9bea46da8d628f99fb6c4161076e1
+size 41943040
diff --git a/params_shard_332.bin b/params_shard_332.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0f83a7cd877eedef7ca3364181cd07ae9d31f3d0
--- /dev/null
+++ b/params_shard_332.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d7e85c0ec175d07ba39d19ef947f3724887a0ca907870bfaa1c62f52126be005
+size 33554432
diff --git a/params_shard_333.bin b/params_shard_333.bin
new file mode 100644
index 0000000000000000000000000000000000000000..86971d6f479261259463b2f2dc8a9c33daef4357
--- /dev/null
+++ b/params_shard_333.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:183b6626550963cd9240a34c9e5b533cefc0d2ef894b4440a4a4468f267c68dd
+size 234881024
diff --git a/params_shard_334.bin b/params_shard_334.bin
new file mode 100644
index 0000000000000000000000000000000000000000..434eafc5e6740a374be8fcd3a91b319efc68766b
--- /dev/null
+++ b/params_shard_334.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5ba3e526a568d9098c92cb412f33e6a6d437c37c5136e67e9606da0da11ed1e4
+size 29360128
diff --git a/params_shard_335.bin b/params_shard_335.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6a68bcae3d0126762737febe3e9f97faf001d020
--- /dev/null
+++ b/params_shard_335.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2203029beea4da4bc5cb0c8dd662862257e88a5df3bf8cad37a76fb1fed83ed0
+size 117440512
diff --git a/params_shard_336.bin b/params_shard_336.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4512c36baae2c15922e8529b3b2e2167596dede8
--- /dev/null
+++ b/params_shard_336.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7782602a74f8ce102e0bcc76150dbeef541a409b959a47f92104758af94665f8
+size 24150016
diff --git a/params_shard_337.bin b/params_shard_337.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c415bdcabc9e04b085c820f89a9ba857e6ea9323
--- /dev/null
+++ b/params_shard_337.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e3af23fa1ac62028f7127028230bc5b8238dd9f45cbc57d387d465152a7768ef
+size 41943040
diff --git a/params_shard_338.bin b/params_shard_338.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7ec88475c7812cc0b0a999d30d28714b686ba222
--- /dev/null
+++ b/params_shard_338.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e39cf35d426b158244ad567d51fefb8088cfb987c02604ea13191ac5e95800d3
+size 33554432
diff --git a/params_shard_339.bin b/params_shard_339.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e907610d254238bb2f815925e006f04003afbb1a
--- /dev/null
+++ b/params_shard_339.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:664c3b2d2e18bfff55dae9563dd31c1dc71e510f0327f7a1e55b6008ced71433
+size 234881024
diff --git a/params_shard_34.bin b/params_shard_34.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7cfc851b810bddd659ec98f0487ced6f40379072
--- /dev/null
+++ b/params_shard_34.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a3ea964ad9c350143f0fcb1ed532f84b1ae79d4b962e690c9e52b0bf07f77b9
+size 29360128
diff --git a/params_shard_340.bin b/params_shard_340.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f7e47fba7000ce399462150f0b903c9f3e6b0100
--- /dev/null
+++ b/params_shard_340.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1e5e54d891aa6c9b2f00d6fa3fcba67cd408d004da43bd7d6f98d033734eec2e
+size 29360128
diff --git a/params_shard_341.bin b/params_shard_341.bin
new file mode 100644
index 0000000000000000000000000000000000000000..80908972185a9c9da91ea0f643d35628b23ebd0f
--- /dev/null
+++ b/params_shard_341.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:425fba0ee421f16da82e22320eae4939ef32489d13af7a1e6e86af740f22a95a
+size 117440512
diff --git a/params_shard_342.bin b/params_shard_342.bin
new file mode 100644
index 0000000000000000000000000000000000000000..00fa1427547020a338abbe51e68cb563f138de03
--- /dev/null
+++ b/params_shard_342.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b73c58f0533ce5f46e1bf8d18569d9c38b3cbb3f3bda0e3c058536aab7577114
+size 24150016
diff --git a/params_shard_343.bin b/params_shard_343.bin
new file mode 100644
index 0000000000000000000000000000000000000000..96cb3128ba91db97ff9958865e4f081557b1a6e3
--- /dev/null
+++ b/params_shard_343.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1d314441ec622d575634e0f4643791b2e4239f8279e43757416c94dddda09e46
+size 41943040
diff --git a/params_shard_344.bin b/params_shard_344.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d6b1a89b7b7ae857b0fedd542526129a44de0b52
--- /dev/null
+++ b/params_shard_344.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7353cfd72ca63670803a75b7a8adb43bf9eb07027e367396407d49f8546f0196
+size 33554432
diff --git a/params_shard_345.bin b/params_shard_345.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4b068d8c63036e8799a326af5b9daf3849f503d2
--- /dev/null
+++ b/params_shard_345.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e6e5c72b47472ae092869614b93557f9172ff42fa8f83c176546bdff5d2a6f76
+size 234881024
diff --git a/params_shard_346.bin b/params_shard_346.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bb1a34b22a89584c1e86bfc591d6ac102e0c9c46
--- /dev/null
+++ b/params_shard_346.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:769d1706a1125bce503f643f96a648ece88a8442ef7d67157c1e6a2d2490fc1f
+size 29360128
diff --git a/params_shard_347.bin b/params_shard_347.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7e4da4594345db41901e5ccc952c4f5ae2d6e54c
--- /dev/null
+++ b/params_shard_347.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:47101a754051ebdc63f8d6fee29e1962f02bd2f680bd23b963cd36e4bf98f50e
+size 117440512
diff --git a/params_shard_348.bin b/params_shard_348.bin
new file mode 100644
index 0000000000000000000000000000000000000000..683dfcd824d877cafb6968b0a8c39e05d0908d04
--- /dev/null
+++ b/params_shard_348.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ad743387c702ee6dd138d493496eb8a74a0d91e7f2a4ce34cb055d96d820182
+size 24150016
diff --git a/params_shard_349.bin b/params_shard_349.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7094dcf22094da7fe3fcd1c4ac6dfbf63a0946e8
--- /dev/null
+++ b/params_shard_349.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c6695fc62b4a86008cf568456d0607b0d19d55b70b08faea3a0f8c14b4838e9
+size 41943040
diff --git a/params_shard_35.bin b/params_shard_35.bin
new file mode 100644
index 0000000000000000000000000000000000000000..99ed409c4c928539844808f7a77b6e28d3592c18
--- /dev/null
+++ b/params_shard_35.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1929dba5969291afb325a85262609cc525cce812c0fd1830fe013389cdcbb6f9
+size 117440512
diff --git a/params_shard_350.bin b/params_shard_350.bin
new file mode 100644
index 0000000000000000000000000000000000000000..057c5eb1956a0bce1904a048476d2456e694a988
--- /dev/null
+++ b/params_shard_350.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e557b963ab81edc60bea26bc52e15bcf40b8824f1b6827577277e786795c2aa2
+size 33554432
diff --git a/params_shard_351.bin b/params_shard_351.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8aa94f9558d23263e526d6bcf230001209ee9730
--- /dev/null
+++ b/params_shard_351.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:338bd138e42047769ab36081ff7e904653ba848c115b742b8197eac9823cc54b
+size 234881024
diff --git a/params_shard_352.bin b/params_shard_352.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e3719c747cba6945d93d76edc6aba6e19646efff
--- /dev/null
+++ b/params_shard_352.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ba18d4465031c402a1cd8399395830504c84d38b79216a2083dbcb98466f5234
+size 29360128
diff --git a/params_shard_353.bin b/params_shard_353.bin
new file mode 100644
index 0000000000000000000000000000000000000000..29408c5f75e986c06d55ae0921fd54b88420ed10
--- /dev/null
+++ b/params_shard_353.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7135ab653011bb17421e5f009c1cdbc7c1a521efadef0583b0b7c96cff791b6
+size 117440512
diff --git a/params_shard_354.bin b/params_shard_354.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2b4aec1739ececf7f636eb8119ebc1f8ec7039e0
--- /dev/null
+++ b/params_shard_354.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8265c819d835660eac4078e2e8f3e89f8559d66c36b9dc91f8ae21fe2ca82cff
+size 24150016
diff --git a/params_shard_355.bin b/params_shard_355.bin
new file mode 100644
index 0000000000000000000000000000000000000000..687c9993465aadd3f28239cefcbc3e6fd87fc0c3
--- /dev/null
+++ b/params_shard_355.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e96b8bec2f83920c42f3df26ff07915176ca312c4c26ebb1c6905b3071d01fd6
+size 41943040
diff --git a/params_shard_356.bin b/params_shard_356.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bde7031f8595e51ed72ecf4d4044b8d6dcf39e5a
--- /dev/null
+++ b/params_shard_356.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0c676c2c8653ff6b280d71261cce26319219190027bd3856819b6468af8866f1
+size 33554432
diff --git a/params_shard_357.bin b/params_shard_357.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3d92321975697a0eb6e49c5daaed292b38b26397
--- /dev/null
+++ b/params_shard_357.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c8e07d5b1c9ee7386e0c3cef91054e18614aa7f4a02c1acc0052884a6d53396f
+size 234881024
diff --git a/params_shard_358.bin b/params_shard_358.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2eb5182690fb22ce06166ed8e5260334dad7cfba
--- /dev/null
+++ b/params_shard_358.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7398cbfc0b156363df4c362efe0ee8b6bf3a6ed518437d39fbdb520bc6698427
+size 29360128
diff --git a/params_shard_359.bin b/params_shard_359.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e4393f1fa6420a84e6931ebcdf078ddd48c1d342
--- /dev/null
+++ b/params_shard_359.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8899b843797a0cbf2965b1b1696f71450d36f89d382e3b97e4ab5eebb8091ebd
+size 117440512
diff --git a/params_shard_36.bin b/params_shard_36.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2a7943a43280cc90af9e343e86a2a5a4ed2edfff
--- /dev/null
+++ b/params_shard_36.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0afb574c729530ff05c5a3aa1af5887f0faef04154e5592fdb56dee9a9d5cea5
+size 24150016
diff --git a/params_shard_360.bin b/params_shard_360.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eca75bf2374f61f170719d2ad041500f70c68055
--- /dev/null
+++ b/params_shard_360.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:db139ba720a1cb32df23e27515d5b91e6bfee00ebef37ac02e4d3f5164a260ca
+size 24150016
diff --git a/params_shard_361.bin b/params_shard_361.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7bfbc5b50e28f63668eb2cc1cec9feec928bdb26
--- /dev/null
+++ b/params_shard_361.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2193128a7670ca3d73d79c58d9ea43948408777293d3a8573fd5af4e33cbd873
+size 41943040
diff --git a/params_shard_362.bin b/params_shard_362.bin
new file mode 100644
index 0000000000000000000000000000000000000000..45635761222305b710138b74cbbd7363974f9b70
--- /dev/null
+++ b/params_shard_362.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:537459b66ceb311415f86722316808f419c38907465803a3a5357ee075d3ff0d
+size 33554432
diff --git a/params_shard_363.bin b/params_shard_363.bin
new file mode 100644
index 0000000000000000000000000000000000000000..672ac41749792a4a9945e8f75b6a1d653a605cfb
--- /dev/null
+++ b/params_shard_363.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6c1a851bb4ab53eab2bfc0365a684bb61732a1ccfdc6a6f53a3510c036001f6f
+size 234881024
diff --git a/params_shard_364.bin b/params_shard_364.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e25d521ad39902fb5ad8a54c3051223a8e4279cb
--- /dev/null
+++ b/params_shard_364.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bf433079d721ec542bd212fa8fdfddc5b3de6d7df886018c4adbc7615d92cd79
+size 29360128
diff --git a/params_shard_365.bin b/params_shard_365.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c1487bbfd67505df0e9ee543b4c1a1c891686864
--- /dev/null
+++ b/params_shard_365.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:801885cdad3ab0055cb55b9ec5c5d70732643aba31501252a30bd0529fc6da9f
+size 117440512
diff --git a/params_shard_366.bin b/params_shard_366.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8b861c85af0f484688d1e80e35a723495210dd1a
--- /dev/null
+++ b/params_shard_366.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1cd6f16525f76baf9f9eb55774cb341d02fa43b6a9fcf0c3a740f638285a0225
+size 24150016
diff --git a/params_shard_367.bin b/params_shard_367.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e62069ca9e3b01c16c2f2502e7345e5ca488553f
--- /dev/null
+++ b/params_shard_367.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e1ef28eeb018b0963082a6caa29ab6a56359653a50eb7e5eddcc130677a1a9da
+size 41943040
diff --git a/params_shard_368.bin b/params_shard_368.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e15e6de938476c29b8e56eeddcb90da91b953ce1
--- /dev/null
+++ b/params_shard_368.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9faf972dd4a564fc997f1833e34702c1b1888436a9e39f6e176e0b67c674671b
+size 33554432
diff --git a/params_shard_369.bin b/params_shard_369.bin
new file mode 100644
index 0000000000000000000000000000000000000000..86f83bf0ca034ce42e543847fffe1d3e0ffc28bd
--- /dev/null
+++ b/params_shard_369.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a58947f1367cd1947844376092758ccbb04163a21cdac064699e36f053e5d5b9
+size 234881024
diff --git a/params_shard_37.bin b/params_shard_37.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2c350ecdfd045f20561d3b37945fa303864818f5
--- /dev/null
+++ b/params_shard_37.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ea89d68fc58ea9534d9358a35c904e9a9985134872e1eabcc407b7bf41a6cd3e
+size 41943040
diff --git a/params_shard_370.bin b/params_shard_370.bin
new file mode 100644
index 0000000000000000000000000000000000000000..33bc040c41ee2830003a63813bd5f9adb2032267
--- /dev/null
+++ b/params_shard_370.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4a75a5af6cba6f8a2e0bc536738f8febc0762b8c66e96039f7ec703f65f70103
+size 29360128
diff --git a/params_shard_371.bin b/params_shard_371.bin
new file mode 100644
index 0000000000000000000000000000000000000000..17b31fab859369d5608d1185fd4f461901203499
--- /dev/null
+++ b/params_shard_371.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:edbcce651efff6a263739e68b64112fb10b030f812b015d63daa6a09c8d530f8
+size 117440512
diff --git a/params_shard_372.bin b/params_shard_372.bin
new file mode 100644
index 0000000000000000000000000000000000000000..74212bf13a943ecbb0410f158120c41839967edf
--- /dev/null
+++ b/params_shard_372.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d7414707078e68b9b8ef325d323cc5a1fce6dbbe2bc651e1af93f0d4f0da848
+size 24150016
diff --git a/params_shard_373.bin b/params_shard_373.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a3e237beb77b8e3750547baa86d25b976163035e
--- /dev/null
+++ b/params_shard_373.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:54e47dd2ce2f37fbc0c3764c0510badcc2ababe10ea10af96f67f12aea9352a4
+size 41943040
diff --git a/params_shard_374.bin b/params_shard_374.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ddb4a19cee809dac39466a2fdec7dd2270961103
--- /dev/null
+++ b/params_shard_374.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f455b1114b99837899a2fd639c78d36bc9a1df7b3c928178d49506ce390728c8
+size 33554432
diff --git a/params_shard_375.bin b/params_shard_375.bin
new file mode 100644
index 0000000000000000000000000000000000000000..33a5d02a409db9c66050eeb964e31dc8c42f0cfa
--- /dev/null
+++ b/params_shard_375.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bba8a1b04c89c83f9f41f537327992841b34a83fd1eeb6000f2037fd4c1c9559
+size 234881024
diff --git a/params_shard_376.bin b/params_shard_376.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a273334ae8b6671378fa72d0b3290d6582c72732
--- /dev/null
+++ b/params_shard_376.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:10cf745cf2e8f9648ee99ab622d2ca866b9d08c5de8345467bdf11dc1a6e336a
+size 29360128
diff --git a/params_shard_377.bin b/params_shard_377.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0631dffaed7ce2927a014387c5201e465f24299b
--- /dev/null
+++ b/params_shard_377.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a139155712cbdc55c115f2a04807cbc544a4af6399437cf79a99480bd8d72092
+size 117440512
diff --git a/params_shard_378.bin b/params_shard_378.bin
new file mode 100644
index 0000000000000000000000000000000000000000..985e6150e583599d7f0800ecc1612f4fcb288ab2
--- /dev/null
+++ b/params_shard_378.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3c8d9da8fd711655f99998eb1aca26ec16f8ff8b8b7289e8a8c08ea54457100e
+size 24150016
diff --git a/params_shard_379.bin b/params_shard_379.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6328013717b9e5585d412652e77c442f02babff3
--- /dev/null
+++ b/params_shard_379.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a153bbd3f953d1a29f017e2e158d8e416088b21446a7664087403d8ab786a940
+size 41943040
diff --git a/params_shard_38.bin b/params_shard_38.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cf39ce0570d1a9d0664bbddc60587d24f50f7f84
--- /dev/null
+++ b/params_shard_38.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6f94ee18afe733dae1931ed788e7a1a5a0f98de6cc1d9b198f0446718e4b5c0f
+size 33554432
diff --git a/params_shard_380.bin b/params_shard_380.bin
new file mode 100644
index 0000000000000000000000000000000000000000..930299cec8b7b906a5802afa294cd5980bd2de34
--- /dev/null
+++ b/params_shard_380.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d07e8f6cf8fdc03917de5f7077b0b66e34f0cbf24cae3a74f75434e24231f91
+size 33554432
diff --git a/params_shard_381.bin b/params_shard_381.bin
new file mode 100644
index 0000000000000000000000000000000000000000..245429c862bb7fe2614a4de8d25f558a5db58934
--- /dev/null
+++ b/params_shard_381.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:27bef07359d5a92c32fe10cba66a09e7852dab2ae9b2a8aa020ce9796788ccf3
+size 234881024
diff --git a/params_shard_382.bin b/params_shard_382.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ab94e49b30300d3ecd694f3ea3419142c220f066
--- /dev/null
+++ b/params_shard_382.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b1a72a3f3e036f26ecfc74f3a4639503bdb2cee672167a0d2cfbb5d53b09b6f8
+size 29360128
diff --git a/params_shard_383.bin b/params_shard_383.bin
new file mode 100644
index 0000000000000000000000000000000000000000..728956661c9ccf0e1ddffc32b861641fc3c769bb
--- /dev/null
+++ b/params_shard_383.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4c3b54184671389f41c708799f9743bb3c8a326583ddd9ad4e9f3e7da068e4f
+size 117440512
diff --git a/params_shard_384.bin b/params_shard_384.bin
new file mode 100644
index 0000000000000000000000000000000000000000..34640a5dcea91203ae0b2168203718e28a07fd2f
--- /dev/null
+++ b/params_shard_384.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d2f59c1fa43753940b5feef8083201cb4238bc28a29ac7b0ad341023975945a
+size 24150016
diff --git a/params_shard_385.bin b/params_shard_385.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a0fac4877c2aa0a9bf5578d1914104ddefd5e2de
--- /dev/null
+++ b/params_shard_385.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a1d44c8e7e7c0ce070e5f75b160b4cb473601e94e2805742bccef5052bee5117
+size 41943040
diff --git a/params_shard_386.bin b/params_shard_386.bin
new file mode 100644
index 0000000000000000000000000000000000000000..27c53e2240505fad8275046a03c551ef324db424
--- /dev/null
+++ b/params_shard_386.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d97f4d9526321879e3bc183e16a11c669de38df8961fd8aa6bb2a30ff7b3caae
+size 33554432
diff --git a/params_shard_387.bin b/params_shard_387.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7d7837f5d543ee47add1080cc3d7899e16d73ac3
--- /dev/null
+++ b/params_shard_387.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:79216b8ad3898d12b68ada91a80a2b8b582abbef05953340caac4e61aab7895b
+size 234881024
diff --git a/params_shard_388.bin b/params_shard_388.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8b3a95eb6873c7a6e0eb9a4f86b39797fa33aaef
--- /dev/null
+++ b/params_shard_388.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e45873152e9cfb903dbf4fddd8502a3a5b67831fd732bdedcb2870e91a10de45
+size 29360128
diff --git a/params_shard_389.bin b/params_shard_389.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0e0f44b694b6fe89bce9ff2a6da57d41b1cb38d8
--- /dev/null
+++ b/params_shard_389.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:214150aa455025d8d0c487eb265428ec00c030ac598889ec5a491c6e3f334c67
+size 117440512
diff --git a/params_shard_39.bin b/params_shard_39.bin
new file mode 100644
index 0000000000000000000000000000000000000000..486babfd95d256d992d62e42d120e370dde63a85
--- /dev/null
+++ b/params_shard_39.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:31c807621bf0e531911d415bb4375ee904d87919205fa17a1704a150cb5787b4
+size 234881024
diff --git a/params_shard_390.bin b/params_shard_390.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ea0006d425b79cc267d462a612f0e02f47d93c1
--- /dev/null
+++ b/params_shard_390.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5dde741da10042986979d0a412dc49515fbe23d088f80016168352a1e4c31136
+size 24150016
diff --git a/params_shard_391.bin b/params_shard_391.bin
new file mode 100644
index 0000000000000000000000000000000000000000..750a5f0d756684c303d0fe6aed37c75e3e7f9053
--- /dev/null
+++ b/params_shard_391.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9a8478c906c7bd6e8525163897823406371fa1a68aa822c740470b9bb9204552
+size 41943040
diff --git a/params_shard_392.bin b/params_shard_392.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6e63bce422564e02770fdc14a04f3fa9a4c0b617
--- /dev/null
+++ b/params_shard_392.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:157a848c8b67c3b311d3668554a3ff58e088f92bb592e9c7165c32c009fff829
+size 33554432
diff --git a/params_shard_393.bin b/params_shard_393.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8704d8f016a5e2a172e75e949b271c9032bfa1ed
--- /dev/null
+++ b/params_shard_393.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8afdbfa66a819e4203ff6427902742eb628bc547bb6fc8c0314e30ff7234deca
+size 234881024
diff --git a/params_shard_394.bin b/params_shard_394.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ba92be53ec68e3661918c919831a815e2411dd4a
--- /dev/null
+++ b/params_shard_394.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3e37a54beb7394ad5e99b5dd4d91fee4e2c96d1a689191363179d3c2a1e9d30f
+size 29360128
diff --git a/params_shard_395.bin b/params_shard_395.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7abe08e8338fb635a86ca24e854512d000b0e026
--- /dev/null
+++ b/params_shard_395.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b0e128dd7aa187e79c050a1c1e3c4448bee6c18e264e1dbac1881fc1e3ec032
+size 117440512
diff --git a/params_shard_396.bin b/params_shard_396.bin
new file mode 100644
index 0000000000000000000000000000000000000000..267dde09cd40e75e6cef48657a29de4b59c8db33
--- /dev/null
+++ b/params_shard_396.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f1b0b4baa87508139c2e2756bb6cee70f0ca21431c5640f60ab5bf3a0df8062
+size 24150016
diff --git a/params_shard_397.bin b/params_shard_397.bin
new file mode 100644
index 0000000000000000000000000000000000000000..793828b9853baa0eeb5044a7d3e36754576e8e7f
--- /dev/null
+++ b/params_shard_397.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a96490ef28041263ea616d99a86a3c55db45a44b1c235982b4038cfc5920b966
+size 41943040
diff --git a/params_shard_398.bin b/params_shard_398.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5bf5bbd886738d15d4a3831ee24100afd4a9be99
--- /dev/null
+++ b/params_shard_398.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9bf4cd49b2e88dd45e97c71c5065196450dace314431bcbce9d10f6ab71016f0
+size 33554432
diff --git a/params_shard_399.bin b/params_shard_399.bin
new file mode 100644
index 0000000000000000000000000000000000000000..94ddb671c257efd78375ea376b72bf1faa3c8b03
--- /dev/null
+++ b/params_shard_399.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:59ea4907531fc45ee7684328fdfe1d7830e41db6646ffd0a1dcf8f505a061a9a
+size 234881024
diff --git a/params_shard_4.bin b/params_shard_4.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7c5869599eea07b766865bd1315c0d85a6a97e03
--- /dev/null
+++ b/params_shard_4.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dfc3a126fefc347350e84f475bb6655aad7aa7615eea57c9a01daa2a04077dcf
+size 234881024
diff --git a/params_shard_40.bin b/params_shard_40.bin
new file mode 100644
index 0000000000000000000000000000000000000000..df94ee6b755edb96ec3a8ae75564be2026e187d0
--- /dev/null
+++ b/params_shard_40.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:66e4621cd0883032536ba14e3fee1c8cb03952a08bc735799ead048cfe657f71
+size 29360128
diff --git a/params_shard_400.bin b/params_shard_400.bin
new file mode 100644
index 0000000000000000000000000000000000000000..83ba173e787c01bcd7a786c49a98178f912d6c34
--- /dev/null
+++ b/params_shard_400.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:22782f15fdd579259a7ff210ec02b3b8f2f2ac078ddc220af74f56f5e21d70c1
+size 29360128
diff --git a/params_shard_401.bin b/params_shard_401.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a1f4e59f802e6512d2209d4035a0d8c77756ee86
--- /dev/null
+++ b/params_shard_401.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:801e4cce1dc2ea7cdb6ead2f32164427f196bba946306173cf5926070670837d
+size 117440512
diff --git a/params_shard_402.bin b/params_shard_402.bin
new file mode 100644
index 0000000000000000000000000000000000000000..913ecfe0726099ecdc20996353462217df870a79
--- /dev/null
+++ b/params_shard_402.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:50e275da0fd7973f3861411734aedb725054f66ab489881845f1dae07cdd490f
+size 24150016
diff --git a/params_shard_403.bin b/params_shard_403.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5aa503038e9a8a93b000e9ffff390ef35de9884d
--- /dev/null
+++ b/params_shard_403.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a5a7ec0b3eac12340cda96adcfca90020698916f979f5f86ed11e8c85ec21a3
+size 41943040
diff --git a/params_shard_404.bin b/params_shard_404.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36f41b4f862e69a53b9c80f1c45978bc3215a165
--- /dev/null
+++ b/params_shard_404.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cda825cfc77638b7b31e8afc2cf892664f739528da6eae51a784e09b5d4b5a4c
+size 33554432
diff --git a/params_shard_405.bin b/params_shard_405.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a77f148d44daaf2c834da69d775c7df8efb9e8fc
--- /dev/null
+++ b/params_shard_405.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c25182983dfa6043266ec7b616cf7ae7cd9182bb12ca58579d4f2891d2285cfa
+size 234881024
diff --git a/params_shard_406.bin b/params_shard_406.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e4beec71bedaddb17309938a107c42ffea38612b
--- /dev/null
+++ b/params_shard_406.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ad183125ba7f89d547725c7567442c86f92b41c65dbd042568b26060a0e3316e
+size 29360128
diff --git a/params_shard_407.bin b/params_shard_407.bin
new file mode 100644
index 0000000000000000000000000000000000000000..30e4f603c61476c5ee4574f2f6b96df34179466d
--- /dev/null
+++ b/params_shard_407.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb707ff2113a00a2f5f00a9fa93c5df4cab1cf5681bee5c1b9b70d56658c9346
+size 117440512
diff --git a/params_shard_408.bin b/params_shard_408.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4602175672913bb152adae7686dddbaf33f2a8a2
--- /dev/null
+++ b/params_shard_408.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:86ace47a5fd4521fdad7d380890f797f369bf766b3626ad5602364e5f3d566f4
+size 24150016
diff --git a/params_shard_409.bin b/params_shard_409.bin
new file mode 100644
index 0000000000000000000000000000000000000000..661d8c884f8efae94c6c33bada532c86ba857c12
--- /dev/null
+++ b/params_shard_409.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e59d19697c0029abcaad5915ea897539cdc1873dcace6b3770c779565a1c5103
+size 41943040
diff --git a/params_shard_41.bin b/params_shard_41.bin
new file mode 100644
index 0000000000000000000000000000000000000000..78803dd0952f413fdfc285866f1e14c7c5ccdfaa
--- /dev/null
+++ b/params_shard_41.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b7103993e43babd140df50df30edb09ba98064ff27ada31f22d9ceac47b97e88
+size 117440512
diff --git a/params_shard_410.bin b/params_shard_410.bin
new file mode 100644
index 0000000000000000000000000000000000000000..496965526f75d2977607f347f969559013c49905
--- /dev/null
+++ b/params_shard_410.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1648f32ff6c44921bd14fdeb5eba8dfefcf5e8c6934d209bd0aa538ac2932315
+size 33554432
diff --git a/params_shard_411.bin b/params_shard_411.bin
new file mode 100644
index 0000000000000000000000000000000000000000..296d0e086ad0ee187bc05ed45c18d6f5e998467a
--- /dev/null
+++ b/params_shard_411.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:775ac24168f07ee45350d30378cfae5f2cddecf37a5cc224b7731a6e05e758bd
+size 234881024
diff --git a/params_shard_412.bin b/params_shard_412.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f7381a80d87ebd62da51f7f01d56e5c5012f5d7e
--- /dev/null
+++ b/params_shard_412.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:895325ffa531549507fcc8d53e274f3311e8b37fae966d9e8abdd763f7c0088f
+size 29360128
diff --git a/params_shard_413.bin b/params_shard_413.bin
new file mode 100644
index 0000000000000000000000000000000000000000..873372af60b9aefe8abe0ea2879eec2dd593a563
--- /dev/null
+++ b/params_shard_413.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:30adffbb08ae28df98781e121570654ec767fb49e7454c9790fa3208f2e76060
+size 117440512
diff --git a/params_shard_414.bin b/params_shard_414.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a68952bbb861594509544007ab6963d979fa974b
--- /dev/null
+++ b/params_shard_414.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c12037a7e29318bb4993501cc25effa5443d2d6ea2115b6df93c1f10711f8c0
+size 24150016
diff --git a/params_shard_415.bin b/params_shard_415.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c23bd11869f0008cd452443ad771bf3df0771a51
--- /dev/null
+++ b/params_shard_415.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:834c282c5e1c47cc08beb2845ae9e36947a63d390dc16dca217d05a64a91801c
+size 41943040
diff --git a/params_shard_416.bin b/params_shard_416.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f56779b7e81d6f24bd7ec3668e7264f6703c6e2b
--- /dev/null
+++ b/params_shard_416.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a6931562e2f979470964870bcfc6019503444fab389dc9c5e92bd7962313937c
+size 33554432
diff --git a/params_shard_417.bin b/params_shard_417.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2fc5f8d9dd1fdffd1c58e63f3495b11098aaf7ff
--- /dev/null
+++ b/params_shard_417.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d62000d3120a51405ec8334173646f46118afa9657c5435f647544a2ffc5231b
+size 234881024
diff --git a/params_shard_418.bin b/params_shard_418.bin
new file mode 100644
index 0000000000000000000000000000000000000000..be01acfe8a6a9274ce7700fa0d5e718efbec1f61
--- /dev/null
+++ b/params_shard_418.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:299a5e266a4ae70fd16eedc219c30222edc8d10988ae4ce1d79990e4b266e88b
+size 29360128
diff --git a/params_shard_419.bin b/params_shard_419.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a2d2f3828e74830537ef0c4cab1adbf869445b2f
--- /dev/null
+++ b/params_shard_419.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:76fa27c9d056427b73f4f901d4a8f01a06b703dfd987eccf070b4f527a151cc5
+size 117440512
diff --git a/params_shard_42.bin b/params_shard_42.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7aa405c1adcb8c951f66437e3960b4bacfd101e0
--- /dev/null
+++ b/params_shard_42.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:125f604fd54fa7d78a43559a575bd0438b7301a3a11acd11b5350210f9c12cdc
+size 24150016
diff --git a/params_shard_420.bin b/params_shard_420.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fa848926860602760d398c75546621ee5bd728b2
--- /dev/null
+++ b/params_shard_420.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4f6abe5d3bbd0d543ebdb3fca0c954a0b73ff7c69f999f55cd5156298f28bf41
+size 24150016
diff --git a/params_shard_421.bin b/params_shard_421.bin
new file mode 100644
index 0000000000000000000000000000000000000000..60b7d3e3b77d9f42737e46f26da4991b039033d7
--- /dev/null
+++ b/params_shard_421.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3b245e33452ea584a3790ce0cc7599d2cc45b8e7a352572500b61c10b05159fa
+size 41943040
diff --git a/params_shard_422.bin b/params_shard_422.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6baa2172b387c8e48408193eca521f9a8e147372
--- /dev/null
+++ b/params_shard_422.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c335a8355c49fd54e1a62a39679b7b3856eca8acc3323ea3ffae4ea4b2c50383
+size 33554432
diff --git a/params_shard_423.bin b/params_shard_423.bin
new file mode 100644
index 0000000000000000000000000000000000000000..976f1e169c3e9ffbcbf30a8a415def255bc7d2b2
--- /dev/null
+++ b/params_shard_423.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:460cc7c9da7758dc2f986b7b367c6c6eaa3e72971b8866b9eebdb156555a44a0
+size 234881024
diff --git a/params_shard_424.bin b/params_shard_424.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cc1a22da807286d2d63df742788907456ad1c875
--- /dev/null
+++ b/params_shard_424.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:75ac8f302bf6b7b59be8b1aaaf5c5950b7bbdf89a1c44308fe60e63fcc782d0c
+size 29360128
diff --git a/params_shard_425.bin b/params_shard_425.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9f3a37f4ed8963ac3856bf8ee1294998a7a9515a
--- /dev/null
+++ b/params_shard_425.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6a863ea9ba007f5e84a00a8cc5255e7f77fa29de225fc2795230683312e77aee
+size 117440512
diff --git a/params_shard_426.bin b/params_shard_426.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e7c61f1ab96a1afbe2e8a5ca4f67110972b3fa86
--- /dev/null
+++ b/params_shard_426.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a3e700f0155c2ef889ef4872911915ffac60a2829c926795cb9722a8998a820c
+size 24150016
diff --git a/params_shard_427.bin b/params_shard_427.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f34e83fffcd6be82238ac9ca02590de2d9c776db
--- /dev/null
+++ b/params_shard_427.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:becdc7068d5485954d05ef265548ad006d46b99c299be828592dd92269bf6fad
+size 41943040
diff --git a/params_shard_428.bin b/params_shard_428.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6f42d1ff4e8bc772ad91baa539d554631b4480e5
--- /dev/null
+++ b/params_shard_428.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d188ebcec4c1a74b5b13cfed1e124bd50000dc636b7804e92701e2bdd5dcda06
+size 33554432
diff --git a/params_shard_429.bin b/params_shard_429.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1a7642e2ce6c56899fdfe07b6c3f03b0beed15d5
--- /dev/null
+++ b/params_shard_429.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:21c204f79ed82b43f7ed7813541f6965237e4b2cba39483fddadce46580d0597
+size 234881024
diff --git a/params_shard_43.bin b/params_shard_43.bin
new file mode 100644
index 0000000000000000000000000000000000000000..37c2160709f6589bcf2759b4e88341f875425659
--- /dev/null
+++ b/params_shard_43.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ea41203ec0f76fb9776a1f434e3339d075dc4720febcb0895aad3591533b84d5
+size 41943040
diff --git a/params_shard_430.bin b/params_shard_430.bin
new file mode 100644
index 0000000000000000000000000000000000000000..02f99bc167219e9ebe26a0e881fe3cddd4943922
--- /dev/null
+++ b/params_shard_430.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bca4a8257f5309a1d340352a5a8510d6bb2f249ac55f85eff0e3cd90d1594789
+size 29360128
diff --git a/params_shard_431.bin b/params_shard_431.bin
new file mode 100644
index 0000000000000000000000000000000000000000..05ba8c78e26d77459dc4a20aea91412d3bb89121
--- /dev/null
+++ b/params_shard_431.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6261ec9fff5206d7e57dfcc68fd0e9312782978e160c33a9cf28c7822f089876
+size 117440512
diff --git a/params_shard_432.bin b/params_shard_432.bin
new file mode 100644
index 0000000000000000000000000000000000000000..69f03a1c423a935ae743bf15b1cef277d1ce8dad
--- /dev/null
+++ b/params_shard_432.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e7a5fac9fe3778deddab9e7fbb19d386a1d430e327b1e8987a187877ad97b133
+size 24150016
diff --git a/params_shard_433.bin b/params_shard_433.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fcf040a695018e139131fbaebc1ac8e56b724f49
--- /dev/null
+++ b/params_shard_433.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7099691d7f4b36ffbd922b6ba9a05aff9ffe39cdb75e2ec1503f8a4e1491eb11
+size 41943040
diff --git a/params_shard_434.bin b/params_shard_434.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9b046b15bccf17120c818163da3cd310eb601462
--- /dev/null
+++ b/params_shard_434.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:00555926aa4cddb69b5cee5a4e837147b534b3b79a0074947204580ba7e55ed7
+size 33554432
diff --git a/params_shard_435.bin b/params_shard_435.bin
new file mode 100644
index 0000000000000000000000000000000000000000..61018861485eb3a9bfaecb905907da59f440ee95
--- /dev/null
+++ b/params_shard_435.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f0514682a2b9d4cc453ba73831522935f4bba8394c095da5c7eccf3dda03c1fd
+size 234881024
diff --git a/params_shard_436.bin b/params_shard_436.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e4c1d0c11208871281d2e74c5872fba99143d5a8
--- /dev/null
+++ b/params_shard_436.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6df5262ffdd001711a8990e33099b675ea486aa8bc3b7dd6499b6e560ffdba3
+size 29360128
diff --git a/params_shard_437.bin b/params_shard_437.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8971c601dc553b37fc0bdc86f5b4fe42349d2eec
--- /dev/null
+++ b/params_shard_437.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af96578e892d5c5830cf35d127f9208ab080bb7797167f568a6ca82a7db1bb02
+size 117440512
diff --git a/params_shard_438.bin b/params_shard_438.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e972cc5a259b39cc3328734f7ce8c6a502b065e1
--- /dev/null
+++ b/params_shard_438.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:169c09efeade824ab9b3bd7d03e544cf7b78536f0f537f9d3a992e4f852f271e
+size 24150016
diff --git a/params_shard_439.bin b/params_shard_439.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1aae745e42aa470ff13cb882b984eb168939035b
--- /dev/null
+++ b/params_shard_439.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c350cbbf3ed50097ca4a0130d1ed0608e55ccf1db806ccf20dd24f0be22e021
+size 41943040
diff --git a/params_shard_44.bin b/params_shard_44.bin
new file mode 100644
index 0000000000000000000000000000000000000000..20c76140f4d1bca8e6aedc044ce606b89f627e85
--- /dev/null
+++ b/params_shard_44.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5310399d5dda392670e0fbcc6b4e26c055148d2ee9ecbbfd1eef85f9e2eaedc6
+size 33554432
diff --git a/params_shard_440.bin b/params_shard_440.bin
new file mode 100644
index 0000000000000000000000000000000000000000..da2436d7d9c5504219ca84c2454ab7050738d4ce
--- /dev/null
+++ b/params_shard_440.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b9e16d60c23d74573420890b598ab20d60090be67beb39d80abcd8f9748d5635
+size 33554432
diff --git a/params_shard_441.bin b/params_shard_441.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2d8392632fb32830de3808a07b4211a11bc9928b
--- /dev/null
+++ b/params_shard_441.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d7f47ab9d65dec980b53e2998ca9be1bc03f00f9daf047d57054b802b18a86e3
+size 234881024
diff --git a/params_shard_442.bin b/params_shard_442.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6164943c4d58dcc3df613eb078c85989491fd14c
--- /dev/null
+++ b/params_shard_442.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d99e5630b922415de36d7b50eeca517047c09613222a7e8db97e7fa341585ea
+size 29360128
diff --git a/params_shard_443.bin b/params_shard_443.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c5479091112ad01345364c09e052e4457cb5ad30
--- /dev/null
+++ b/params_shard_443.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8e36fc50f02442f58e5dfb370473fe0d58e5832a09ce82083c7edc268389119b
+size 117440512
diff --git a/params_shard_444.bin b/params_shard_444.bin
new file mode 100644
index 0000000000000000000000000000000000000000..af47e701d0e5780472fe57491fa7f45eeb152608
--- /dev/null
+++ b/params_shard_444.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0d137fd2f45370caa46fb86580b57d6742182cceb3e57939aac455a11c1c19fa
+size 24150016
diff --git a/params_shard_445.bin b/params_shard_445.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8d6f59be084196770469e49fb2753ab7d7114b78
--- /dev/null
+++ b/params_shard_445.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e76ed7075c7b1234c854c4485b115819a8f069b099f5a67bf53787da2f7dd4e4
+size 41943040
diff --git a/params_shard_446.bin b/params_shard_446.bin
new file mode 100644
index 0000000000000000000000000000000000000000..89499d5477502f251133538230df0e68879a0603
--- /dev/null
+++ b/params_shard_446.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3990e7fcba71774d559e2310e55b3bee4d66f75c453f8439bafa1226c55a89d
+size 33554432
diff --git a/params_shard_447.bin b/params_shard_447.bin
new file mode 100644
index 0000000000000000000000000000000000000000..70c7ff17265774352fc1f25efd2612b421bfd3e4
--- /dev/null
+++ b/params_shard_447.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:826809148faf2e657358be6fb41512f4dee789edaf26e7528ec8a98a14ce6781
+size 234881024
diff --git a/params_shard_448.bin b/params_shard_448.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f0bf808af91c086cee69790d8db5184e00296969
--- /dev/null
+++ b/params_shard_448.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b4e59c62e6b256cb00ef56c7d1075da10418d5d9ec5f7cb7cd397060b91077c6
+size 29360128
diff --git a/params_shard_449.bin b/params_shard_449.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e5fdf0b5125e11dfed80312e5714a9387136dbcc
--- /dev/null
+++ b/params_shard_449.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:869a0c7531dbe9f4b691b42426fce942758d3bf8ce0f06da090e00ee421b0da2
+size 117440512
diff --git a/params_shard_45.bin b/params_shard_45.bin
new file mode 100644
index 0000000000000000000000000000000000000000..76f8bcaa57b6df9af32da201df0e7d112829b402
--- /dev/null
+++ b/params_shard_45.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2376e655a461a40b39c62c8a85bc6fa3d3cb6173f5a325de5b8803f532156908
+size 234881024
diff --git a/params_shard_450.bin b/params_shard_450.bin
new file mode 100644
index 0000000000000000000000000000000000000000..812c2e9bfd05af808f399d6416bca06c617251cb
--- /dev/null
+++ b/params_shard_450.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d6fb2c7600c4fe1471934f4402818fe3ceb6103182becc1c41c7f7d463bb2ff
+size 24150016
diff --git a/params_shard_451.bin b/params_shard_451.bin
new file mode 100644
index 0000000000000000000000000000000000000000..11ca4f5639ac528e52f223046c76a7230005c2b0
--- /dev/null
+++ b/params_shard_451.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3971f8eb42f24fe2f8e9849936bfe54a6c01d5060edd2ad79739e234a9f20632
+size 41943040
diff --git a/params_shard_452.bin b/params_shard_452.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0de19a63caaa0829e0cb42b159ae3dabb59b7a86
--- /dev/null
+++ b/params_shard_452.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4dccc280cc0a3111054234289b6b2db3d58f723bb29a9b4216cbd281c367127
+size 33554432
diff --git a/params_shard_453.bin b/params_shard_453.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fff048c537f2f242693004fe4cbabd49315fa609
--- /dev/null
+++ b/params_shard_453.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b9a64c6f57840c89dccb3c2521addfb08075a907aa2363e57863199c9be6b28d
+size 234881024
diff --git a/params_shard_454.bin b/params_shard_454.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d7daa581ae9a8658397a2fc4477150eb88a7f711
--- /dev/null
+++ b/params_shard_454.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:493078d5ff3c7a2f50574c8289ad9f18d4f17c14f0dd6ccc6ae30eaa34fd2417
+size 29360128
diff --git a/params_shard_455.bin b/params_shard_455.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2f5c6021aaeec4b741c4823b8415779032726e35
--- /dev/null
+++ b/params_shard_455.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:004d9445ff537bd6985d1a42bcdf349e4bf641be1228eecb53f9f604be7aec44
+size 117440512
diff --git a/params_shard_456.bin b/params_shard_456.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8e3d296991a65e2f0177fadf5c624de8d37fe5d1
--- /dev/null
+++ b/params_shard_456.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2c27ad4ffe64b17b7523de059e94a88ef8615737ba221da6d35cf133d3af9a11
+size 24150016
diff --git a/params_shard_457.bin b/params_shard_457.bin
new file mode 100644
index 0000000000000000000000000000000000000000..618f10b0ee5f9923504f07530558f70192c6bd74
--- /dev/null
+++ b/params_shard_457.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fafe32661b4767d4c4563f44e59b7942c52e539a2de1f43102fef00aa1349a3c
+size 41943040
diff --git a/params_shard_458.bin b/params_shard_458.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c2aa6ed93629a8e5423f1ebe1b63fd02650e1768
--- /dev/null
+++ b/params_shard_458.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9546a0d394b2998b14e181ab50dbc1a898b3d87de8a66f06885075edac7b9f1a
+size 33554432
diff --git a/params_shard_459.bin b/params_shard_459.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b14bbc069ce796664e8fdb672f56ea2636f61129
--- /dev/null
+++ b/params_shard_459.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:63d0b93b1f7e73282bff8d60ddfc52a3a58ce84ad3e24f765043b83df4ae32d7
+size 234881024
diff --git a/params_shard_46.bin b/params_shard_46.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4f48f77aebfbc473b0f9e59cac90d5a55903b051
--- /dev/null
+++ b/params_shard_46.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e976f4449141b7d03be6f9ae972d9fcc696d6857180ee49d7729427dc59745da
+size 29360128
diff --git a/params_shard_460.bin b/params_shard_460.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5b4ecafab6dee82d1798ba50d864deec7f6a8601
--- /dev/null
+++ b/params_shard_460.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8028b008fe1d75b723d08de5e4fd7f998b150b4587fe83e688551dfc3bcab5be
+size 29360128
diff --git a/params_shard_461.bin b/params_shard_461.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f5392f20511aa3e1e12d7f770621af77db9ce47b
--- /dev/null
+++ b/params_shard_461.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c25bec1f2ca734b5a31a8e7a4ed227cf4f5ff3124b185507b4792130358f14ec
+size 117440512
diff --git a/params_shard_462.bin b/params_shard_462.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0ac98f0515ca8b189373b91d8f4446755e4c1a57
--- /dev/null
+++ b/params_shard_462.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bb67bd7ae7a87a74e3db2d54ffa0bd1b62df8357f062b5409ef3df8f25801895
+size 24150016
diff --git a/params_shard_463.bin b/params_shard_463.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c2d283a965f64d5b61b7af02008d3660e2a98ff3
--- /dev/null
+++ b/params_shard_463.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a07d4fe031b81b68697fcd272a6441ef65d8c331712f5bb53fa33a105c9b516
+size 41943040
diff --git a/params_shard_464.bin b/params_shard_464.bin
new file mode 100644
index 0000000000000000000000000000000000000000..de289131164c65cf0379a266566a59b956336399
--- /dev/null
+++ b/params_shard_464.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:790740474f211d883cff4860849354a93ed2cfa354d88ca5e380f8e7d2b2383a
+size 33554432
diff --git a/params_shard_465.bin b/params_shard_465.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d315567a7f3c1df52994a5c59b7da77d1725db9
--- /dev/null
+++ b/params_shard_465.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a965077395ff53b0e186e982cfaa611c0d92acd045d0c24b83d5137bbf38a774
+size 234881024
diff --git a/params_shard_466.bin b/params_shard_466.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9a30488c6c220722ed2ae10dfbba1be8849ace91
--- /dev/null
+++ b/params_shard_466.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf3e9657433fc41549892a2b8e11d06723e86db64beeb8c027061063dc6b447c
+size 29360128
diff --git a/params_shard_467.bin b/params_shard_467.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6c6004be8287cedb93d4434160b44fc0f17df2e2
--- /dev/null
+++ b/params_shard_467.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cad21a453e9f9b2061edbbec17f49dfdec80574041e8817eb68462769d35870b
+size 117440512
diff --git a/params_shard_468.bin b/params_shard_468.bin
new file mode 100644
index 0000000000000000000000000000000000000000..52f7a61ffb6bc0f7f337848bc54baf0414b85ab7
--- /dev/null
+++ b/params_shard_468.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3b4e36ff459ee2f0ffbe8f9054c8a61783ca332086cc9671acefad6947264b1d
+size 24150016
diff --git a/params_shard_469.bin b/params_shard_469.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a2059784b926c3b76c73a34a0d841de85c70d2fb
--- /dev/null
+++ b/params_shard_469.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6186079f6b4b8543b0b62c8f64e0d49186a5d6bbb079095a792bdc2b1919bcfa
+size 41943040
diff --git a/params_shard_47.bin b/params_shard_47.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ca4ece0478c45844d1928c251ffaeaacaa2d5998
--- /dev/null
+++ b/params_shard_47.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:42f579628d206a8721ad9128a852c179f1c85b512c9b340169336c440c5566ea
+size 117440512
diff --git a/params_shard_470.bin b/params_shard_470.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9e1709d8234e1ac71ef136c96fb675bf359873b8
--- /dev/null
+++ b/params_shard_470.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:98de088cd6db5c6f9683aaac0e5f6fc95b69f02e55571276b497269a82b07eb5
+size 33554432
diff --git a/params_shard_471.bin b/params_shard_471.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cbc999bcecad2d6bbced7ec83a5107b670345f97
--- /dev/null
+++ b/params_shard_471.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eecd63c81339fd929b50a76bc1b8586a81247fb08a8543183238848e24a9633f
+size 234881024
diff --git a/params_shard_472.bin b/params_shard_472.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0fe6e1036667679d2604bbe8601d939f259e3d78
--- /dev/null
+++ b/params_shard_472.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ce3215b2d9bd180df543b21645556c666b5949003844e287ce6d5f87dd68eaee
+size 29360128
diff --git a/params_shard_473.bin b/params_shard_473.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a15aa4ce564853453bd782ff7b9ae3c44ebb9e0f
--- /dev/null
+++ b/params_shard_473.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e3ed5c6f674038a16338283e3c1adbd176e5026c0553ae5946511b68da4bbcc0
+size 117440512
diff --git a/params_shard_474.bin b/params_shard_474.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f03156e2336a1a7c147eb3949c3c66d394dfc876
--- /dev/null
+++ b/params_shard_474.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b17863fccbcb91e1aaf68d5efeac269411d17be5745c4bca80ca51e1319dcb3
+size 24150016
diff --git a/params_shard_475.bin b/params_shard_475.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2e1fa72c5dc777e7dc07fbb0936c1a6e4e90711f
--- /dev/null
+++ b/params_shard_475.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a3e45e2541d5ce91fed40cd05132e0afb695bac9f775cbea9175c5df393b395c
+size 41943040
diff --git a/params_shard_476.bin b/params_shard_476.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6e55f20e8f9d1405126db8df0c09d8c0bf65acd2
--- /dev/null
+++ b/params_shard_476.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bbfd69174626262456333683bc82340a100adb547856ec907742bbe956e5484c
+size 33554432
diff --git a/params_shard_477.bin b/params_shard_477.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d6962df8f90ed5eceefb2b9da8c2844adad290d
--- /dev/null
+++ b/params_shard_477.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:32f980bddf31d29422b410dcafe0b2e83361e2913aafdc14c6724a2c16956e57
+size 234881024
diff --git a/params_shard_478.bin b/params_shard_478.bin
new file mode 100644
index 0000000000000000000000000000000000000000..242f1495d16194d9c889d59090ab0c75d9cfc6e7
--- /dev/null
+++ b/params_shard_478.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5b0142c46a813fd7f7fdb480f8ee38121932ca6ce4b678ff9da948cb9f6ba403
+size 29360128
diff --git a/params_shard_479.bin b/params_shard_479.bin
new file mode 100644
index 0000000000000000000000000000000000000000..13072d9844e54339bd9bc9ef4e1975d279c0c722
--- /dev/null
+++ b/params_shard_479.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a79ce8968efab90184343b065ba8df65057868132cea14ca22ce2dc956f6e463
+size 117440512
diff --git a/params_shard_48.bin b/params_shard_48.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0022238ff2a1cedd0fff4fff65210edc79d2db02
--- /dev/null
+++ b/params_shard_48.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0b4f0bc56ba668589a4d6a5bc49a0613fccac48e65c6226e9edebd5ff6789710
+size 24150016
diff --git a/params_shard_480.bin b/params_shard_480.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f362dc8ae06f5378e5a1b13cbe18a3e2a1b55756
--- /dev/null
+++ b/params_shard_480.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f7258e53cf0c19b6b7a7ff7bf1a8a0c79d8b69673cf20b968de638e3cd3e297a
+size 24150016
diff --git a/params_shard_481.bin b/params_shard_481.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e7c6ba144f85c5577da5f6006ec59b76ed704a4d
--- /dev/null
+++ b/params_shard_481.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41dab76d27fa298334373971884a658c876b3260ce91223700e3aff5a23f3106
+size 525336576
diff --git a/params_shard_482.bin b/params_shard_482.bin
new file mode 100644
index 0000000000000000000000000000000000000000..309cac6a171c23e5f2f4247d22b1be5b56b5ff60
--- /dev/null
+++ b/params_shard_482.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a14b602c948160cc2f0d64ef5c9a17e6369c71849e9ff34172858f4b340cd623
+size 65667072
diff --git a/params_shard_483.bin b/params_shard_483.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a07b1270fa8e18508e63fe495695e9e876e78aac
--- /dev/null
+++ b/params_shard_483.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:79054a46512f69da72f7ce6f6ec956dbf6dfe365cf52ae9f376b65c2ce5eb742
+size 14729216
diff --git a/params_shard_49.bin b/params_shard_49.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1c9fbbd33abe42b6941edd547c47983acd0335a2
--- /dev/null
+++ b/params_shard_49.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:145fab57d392214e8bda11d64038bbec57d5033de464582e1e4d3ff59561daf7
+size 41943040
diff --git a/params_shard_5.bin b/params_shard_5.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b0b57820dc7df7ec0c6bf4dfab9ec1dc5459fd81
--- /dev/null
+++ b/params_shard_5.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:71fb72815f490b203cb0320d503fc000c511adae7080cc6173523bf320b24941
+size 29360128
diff --git a/params_shard_50.bin b/params_shard_50.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1e43cd35ef92ce4322ae7069e4d250c6b46960ec
--- /dev/null
+++ b/params_shard_50.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:388e50140a3180e0e7649692c92d3320cbc3af4513f5a1bea4e60e428e00aeaf
+size 33554432
diff --git a/params_shard_51.bin b/params_shard_51.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d2b82f33423f70df42f3089ef08c93cf48b55c53
--- /dev/null
+++ b/params_shard_51.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:73448960ac26fa40bc02e57086d4dfb046a6b886631d5b1585696e7193300d18
+size 234881024
diff --git a/params_shard_52.bin b/params_shard_52.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa8a79d501926c46b9f661a70bc1432016633b69
--- /dev/null
+++ b/params_shard_52.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:afba736610baba6483edc944eba379ad140ca2ade47fe0aa3687168af1746c56
+size 29360128
diff --git a/params_shard_53.bin b/params_shard_53.bin
new file mode 100644
index 0000000000000000000000000000000000000000..159e12817e1463cd298d9e66934bef634d28442a
--- /dev/null
+++ b/params_shard_53.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dba88383884c2cad2bc3de6818139facc8a8bac29a6d10aa67b85c438031ad65
+size 117440512
diff --git a/params_shard_54.bin b/params_shard_54.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bf473d0d7d5f9ae51df6f8bdd392bdfa6b05594e
--- /dev/null
+++ b/params_shard_54.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:81f6e93b94137cad20b3738ac81f8c5fa48a871a154efd0001f9be9287c998ab
+size 24150016
diff --git a/params_shard_55.bin b/params_shard_55.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4ac9956d0184145af14d2e0fd7b8f31360f42ef3
--- /dev/null
+++ b/params_shard_55.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c70f563ef878eda812c905816cae02d312c218407c403ef9dc521e1de7865101
+size 41943040
diff --git a/params_shard_56.bin b/params_shard_56.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a0c13be9bb346e3c87b95774fae316fbd6dacaec
--- /dev/null
+++ b/params_shard_56.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d7a49130d961e767751e63d369059433d85cef86e6c17731c1e8d995aa4c063
+size 33554432
diff --git a/params_shard_57.bin b/params_shard_57.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e01dba28e1690758af981ae5172d32ae35dd050a
--- /dev/null
+++ b/params_shard_57.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:921becddd26998f3df00a6a22bb65264cb848274937c73c4638fe64037c2fd7c
+size 234881024
diff --git a/params_shard_58.bin b/params_shard_58.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1a2c54a418ec16896dbb92e04d8194f2bcedd926
--- /dev/null
+++ b/params_shard_58.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8b97204baca5fc3ff6f4ca5c48bc8c783221a25a0d080f3509da75082afdd6d1
+size 29360128
diff --git a/params_shard_59.bin b/params_shard_59.bin
new file mode 100644
index 0000000000000000000000000000000000000000..41db69da364bc22c95571226a1e26a95c7c14e43
--- /dev/null
+++ b/params_shard_59.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:94382231e469ac3978f2def4bf56e0cbdc8b283a277598c9d0ca607e012ad739
+size 117440512
diff --git a/params_shard_6.bin b/params_shard_6.bin
new file mode 100644
index 0000000000000000000000000000000000000000..091149be4a564fa788d4672e1aa4ddd1c3045eec
--- /dev/null
+++ b/params_shard_6.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5c5188f600103fe2a3968e035650cf505a71ea607387b3d4c3afca0583169cda
+size 117440512
diff --git a/params_shard_60.bin b/params_shard_60.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8a1dc21780fd3a49ab6f08c6b7797c410de6316d
--- /dev/null
+++ b/params_shard_60.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:02de7398c45b9e9eff2902ad1904e74eb5af09acad8cb9744efd2cd077ec6ce1
+size 24150016
diff --git a/params_shard_61.bin b/params_shard_61.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e2143994db39c87b6ebb7d94d4b5b057ef92dc88
--- /dev/null
+++ b/params_shard_61.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dfb0ed2e212e3fae49ad745dadbc1c9afc95f9efe37bafc9b077c0500ce331ec
+size 41943040
diff --git a/params_shard_62.bin b/params_shard_62.bin
new file mode 100644
index 0000000000000000000000000000000000000000..65b1272546542ddad28b22055a8814dc993f9090
--- /dev/null
+++ b/params_shard_62.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:89927183aaf4363bb3425c9a016fda2805e5b823314f46a5b03465c16e9855ca
+size 33554432
diff --git a/params_shard_63.bin b/params_shard_63.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c9aba455ff107fc25cea01bae368469b86c2d720
--- /dev/null
+++ b/params_shard_63.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f228ab91dcd7c9dccc99b98f1b5694accc44d545f7d939f20d47595e16ad294c
+size 234881024
diff --git a/params_shard_64.bin b/params_shard_64.bin
new file mode 100644
index 0000000000000000000000000000000000000000..409df1d68f888adc2cdf7f4ab33ff0a3cfb36c56
--- /dev/null
+++ b/params_shard_64.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a65df45652bf0e285a7ad269691cdb7cb480e0a87c995cdb9b7a1dc9eb7758c6
+size 29360128
diff --git a/params_shard_65.bin b/params_shard_65.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e63d8a61e183a74cca1397f70b3d037177bac46f
--- /dev/null
+++ b/params_shard_65.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:67d2fd9dc58cfd5280095f154727ec55298a2c8eb25d4d3d7e960ec476bb25e2
+size 117440512
diff --git a/params_shard_66.bin b/params_shard_66.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d597fd091702ac6d72add134060816400f7f14aa
--- /dev/null
+++ b/params_shard_66.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a64ed1d5628b30bc30524f309d9eaf1ab655ed08db8dc0a7cac2b3e212e3f75
+size 24150016
diff --git a/params_shard_67.bin b/params_shard_67.bin
new file mode 100644
index 0000000000000000000000000000000000000000..29e468c3442b3590a1a7807cce5944e18fcb98c6
--- /dev/null
+++ b/params_shard_67.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6df137b9cb77f66f55d9c4d999ccf3060dba7ada5a564d6c4d730c7edd524216
+size 41943040
diff --git a/params_shard_68.bin b/params_shard_68.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6d49659bf0f02d0fca674cf373e3f12830fc1359
--- /dev/null
+++ b/params_shard_68.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:83e73b43a602c5bb184fa2a979baf6814580a01ebf5919c366ef2bab0e443e7d
+size 33554432
diff --git a/params_shard_69.bin b/params_shard_69.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ee541dafc5687085dbef327a8bc59dbed63575eb
--- /dev/null
+++ b/params_shard_69.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b05b9be466f2f5fea752059638b87ce7910c3483e336e7b1217525e4607949b5
+size 234881024
diff --git a/params_shard_7.bin b/params_shard_7.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e6430a5744552d5e71eeb3be02e50cc50e21433e
--- /dev/null
+++ b/params_shard_7.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fe2f0567e582e49aa250a268ae122f9dc75d448b00d037995721fed17417b82b
+size 41943040
diff --git a/params_shard_70.bin b/params_shard_70.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9b766c9fb2313176636b0dd06089d4f83cc482a2
--- /dev/null
+++ b/params_shard_70.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:45097aa5a84e8d88c7bf1de6d120cc3f35156cbb5dfe8887a3fabb09184ee2f5
+size 29360128
diff --git a/params_shard_71.bin b/params_shard_71.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d12eb573383ce35428ea044016dca96f14fbcda
--- /dev/null
+++ b/params_shard_71.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:53be037e5e0f0c017c7deeba58df977b0a8cd7e315721cfec808e0d9e15ba506
+size 117440512
diff --git a/params_shard_72.bin b/params_shard_72.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa1f04a92e62b5ab78467d5847f65157759a78b0
--- /dev/null
+++ b/params_shard_72.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:33275abe929daeb5a384e538e23a5cb6da6766388c7ee4ce1b74aa5206abd0e2
+size 24150016
diff --git a/params_shard_73.bin b/params_shard_73.bin
new file mode 100644
index 0000000000000000000000000000000000000000..842b2cd2fa520f0cb5aa21a82f70eb3b41b43087
--- /dev/null
+++ b/params_shard_73.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:77b3257151bbe64ffea2b79028e2a6e42e80c1e8d8828dadb500d5ba618a23c0
+size 41943040
diff --git a/params_shard_74.bin b/params_shard_74.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fcb560366eee843fdcf4a411bef6702dca0cc5dd
--- /dev/null
+++ b/params_shard_74.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aff2864f521413c40baf62776627db09bc0b94fb2144c876cd914cba1fca4ce8
+size 33554432
diff --git a/params_shard_75.bin b/params_shard_75.bin
new file mode 100644
index 0000000000000000000000000000000000000000..00c30c944d528f368da07b94afe1d4ea8de750c7
--- /dev/null
+++ b/params_shard_75.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4b2ea4828005ca7b3720315973ce09b02816de7cbaef10f18603a3d87d8f9f41
+size 234881024
diff --git a/params_shard_76.bin b/params_shard_76.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e41f91921a299550f50aeedf65882812a17b4073
--- /dev/null
+++ b/params_shard_76.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:89287e62b9ec3b4477ec9733f85a03fdfbff33d8edfc6cdc5f2e0cf8d0d8e060
+size 29360128
diff --git a/params_shard_77.bin b/params_shard_77.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d162bf1d6b09a4fcf4192946fa20c33ea6139b8f
--- /dev/null
+++ b/params_shard_77.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:22c11d7058b029f41d92178a75206f7c110a64c0dfa470226de86c8359fc896a
+size 117440512
diff --git a/params_shard_78.bin b/params_shard_78.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f5302530e2a6bada2389dd5dc6f153ef313ce566
--- /dev/null
+++ b/params_shard_78.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f33eeb761cddbfd66944a3e9d2290a17fb5fad43e1848c857b6ce8cf7759c968
+size 24150016
diff --git a/params_shard_79.bin b/params_shard_79.bin
new file mode 100644
index 0000000000000000000000000000000000000000..95feabb6952ecc0ca6f8c28b41744622832af051
--- /dev/null
+++ b/params_shard_79.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6f3567da16d75df2fce7be4ab61f83546ae6295ade3cd8b8d04a743102c5b67b
+size 41943040
diff --git a/params_shard_8.bin b/params_shard_8.bin
new file mode 100644
index 0000000000000000000000000000000000000000..114948577b6d496fba6366b73eca9ded7d35707c
--- /dev/null
+++ b/params_shard_8.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:32c58288981b529b6b38dde59894b9152b6f7f4930faf2e255950bf546c16108
+size 33554432
diff --git a/params_shard_80.bin b/params_shard_80.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2a6f0bb7f39abbb41ac5fac685c0d14c464ddec0
--- /dev/null
+++ b/params_shard_80.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b22ae50d3e73120b70e3f60949cc89ac47f4d345743bfca76cc557e1e034a76d
+size 33554432
diff --git a/params_shard_81.bin b/params_shard_81.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fdd16f2194cd2263635a2a73150f7b2e9ee4234d
--- /dev/null
+++ b/params_shard_81.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ed593a29631f67f072eee6306d72064f8f080d519feb2194d36f78015c472bc8
+size 234881024
diff --git a/params_shard_82.bin b/params_shard_82.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5666a2264394cab186d3e8461bda9c530a24c247
--- /dev/null
+++ b/params_shard_82.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2d22303a3a1dfbe03658405f3c62e8f8bf71ee01171d16cd56a8c2fc861d8770
+size 29360128
diff --git a/params_shard_83.bin b/params_shard_83.bin
new file mode 100644
index 0000000000000000000000000000000000000000..06f44ad01cdc45a06914ae11441e4c24019fce25
--- /dev/null
+++ b/params_shard_83.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:679ed92d1902c1884345781278fcf04d03d0d597575db425b5e7ce7a00d54980
+size 117440512
diff --git a/params_shard_84.bin b/params_shard_84.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c10708daf9ed45633f5531e4cadb51f8e090c2d1
--- /dev/null
+++ b/params_shard_84.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7593cc624062c51dd6bee585fb712250c6ecdc8dc34e6583ec5e3b48de29ef1a
+size 24150016
diff --git a/params_shard_85.bin b/params_shard_85.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d50653e00538a3c5870aee099591a58aedeeb1e4
--- /dev/null
+++ b/params_shard_85.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1154051b1ab774e7288cdd84d24479aed8385d2b28e8b298df16fad726567e1d
+size 41943040
diff --git a/params_shard_86.bin b/params_shard_86.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0c93185891e8517c8b2dfd3fdc801b47839c66db
--- /dev/null
+++ b/params_shard_86.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:97ec5934a81659bd3809c5caf2217d477536683243088815592c8c3b02a69624
+size 33554432
diff --git a/params_shard_87.bin b/params_shard_87.bin
new file mode 100644
index 0000000000000000000000000000000000000000..30240ea2a2dccfd0958eb8f20a27e9b4d0476757
--- /dev/null
+++ b/params_shard_87.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:57857c9422c2bf0676510971059765be84f02ed8251733a806b934c0e4178bfe
+size 234881024
diff --git a/params_shard_88.bin b/params_shard_88.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b3bed48adad7a0b99fd408a6dda24bd4fd7fdc3c
--- /dev/null
+++ b/params_shard_88.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2507fef940b78f9fd0c567a781640488b041bb84dd2c0edbc3f97c626cfa8fe2
+size 29360128
diff --git a/params_shard_89.bin b/params_shard_89.bin
new file mode 100644
index 0000000000000000000000000000000000000000..98988bd13211f9b00f14c79b251162136ec0d115
--- /dev/null
+++ b/params_shard_89.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f16cdc25e4170218288bef2be6c76e7b5f31017bc72221d8f3ec1da1911264e7
+size 117440512
diff --git a/params_shard_9.bin b/params_shard_9.bin
new file mode 100644
index 0000000000000000000000000000000000000000..701352e6b3672387dbe82429f96dcccdae35b93b
--- /dev/null
+++ b/params_shard_9.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:10907c4f5961e36deee7b4fddd4a6b099a6bdff1705195e596cd13c8989f2407
+size 29392896
diff --git a/params_shard_90.bin b/params_shard_90.bin
new file mode 100644
index 0000000000000000000000000000000000000000..695999e374f369a702c2f49cdc21aa3a0f753cd6
--- /dev/null
+++ b/params_shard_90.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c5ad0a25a2f47d77ae09f48ed5ebe3e08a265c4884c2adbd809edd662ed7ab8
+size 24150016
diff --git a/params_shard_91.bin b/params_shard_91.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6eade35d282e584612bee22600a50f037d536dae
--- /dev/null
+++ b/params_shard_91.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f3751fa9af416092a6e68c212bdd480761699dc1594b8b76fbfb4fec2da9eb5c
+size 41943040
diff --git a/params_shard_92.bin b/params_shard_92.bin
new file mode 100644
index 0000000000000000000000000000000000000000..467d9359da511549bf4902ba55a457344bbf26c7
--- /dev/null
+++ b/params_shard_92.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6775240158fbe3b64d63e37a0e619bcdf5b641a185e0d0847af0b0043f739f1e
+size 33554432
diff --git a/params_shard_93.bin b/params_shard_93.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ef588ffb1832d0636a0edb5a475ce616db4182e8
--- /dev/null
+++ b/params_shard_93.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dab054102619d34012fd5d559036c7a5f48233f1cff8fb4a8ebfb57fdc75a9d7
+size 234881024
diff --git a/params_shard_94.bin b/params_shard_94.bin
new file mode 100644
index 0000000000000000000000000000000000000000..41c8a0d57eb3dc7fdefd440a8c9d589ce988ed67
--- /dev/null
+++ b/params_shard_94.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:09769922ed6f8e5f14242fce7d775f722c6286b9f0d696b316f706b8d9b93a6b
+size 29360128
diff --git a/params_shard_95.bin b/params_shard_95.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f8a3412bcd48e978843a0b06cd190df65cc6d453
--- /dev/null
+++ b/params_shard_95.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:90b638a797667b95085bb58eacda5686f887c9d70c496051cf5daa5ca382d40d
+size 117440512
diff --git a/params_shard_96.bin b/params_shard_96.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b2c1a9999d92037c159db2ad8b2fc329e56988c5
--- /dev/null
+++ b/params_shard_96.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ff2dc672e3bd48d31b847fc72b223b4eb23527e5d2a3113e792e11a6ed7c7ca
+size 24150016
diff --git a/params_shard_97.bin b/params_shard_97.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a3b88a9f3c2f174aa21cd1a90c3998dd16f3cbe9
--- /dev/null
+++ b/params_shard_97.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b6b5f36c4190282771828a99a69fcb51badde51d8c7b033bd30c039c23c78b1f
+size 41943040
diff --git a/params_shard_98.bin b/params_shard_98.bin
new file mode 100644
index 0000000000000000000000000000000000000000..529240eeced560fd364e7cfa81bf9ded56948506
--- /dev/null
+++ b/params_shard_98.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f7dcd3fcc5cc8db2b720ddbee3ac4c21c467f4f068e8a85e31fccd43493a9180
+size 33554432
diff --git a/params_shard_99.bin b/params_shard_99.bin
new file mode 100644
index 0000000000000000000000000000000000000000..af495528f1bac221670e3e9e2a0514a1b07187de
--- /dev/null
+++ b/params_shard_99.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7242c0e6381b90d5f1d6578fb307f6cbcd9c28dfdea964759f31e955420b2fee
+size 234881024
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..e9c8e7a2359b81191c8021d0f3c5f28c67f20962
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,410509 @@
+{
+ "version": "1.0",
+ "truncation": null,
+ "padding": null,
+ "added_tokens": [
+ {
+ "id": 128000,
+ "content": "<|begin▁of▁sentence|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128001,
+ "content": "<|end▁of▁sentence|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128002,
+ "content": "<|reserved_special_token_0|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128003,
+ "content": "<|reserved_special_token_1|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128004,
+ "content": "<|finetune_right_pad_id|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128005,
+ "content": "<|reserved_special_token_2|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128006,
+ "content": "<|start_header_id|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128007,
+ "content": "<|end_header_id|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128008,
+ "content": "<|eom_id|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128009,
+ "content": "<|eot_id|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128010,
+ "content": "<|python_tag|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 128011,
+ "content": "<|User|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": false
+ },
+ {
+ "id": 128012,
+ "content": "<|Assistant|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": false
+ },
+ {
+ "id": 128013,
+ "content": "
&": 5909, + "CON": 5910, + "Ġrepl": 5911, + "Ġregular": 5912, + "Storage": 5913, + "ramework": 5914, + "Ġgoal": 5915, + "Ġtouch": 5916, + ".widget": 5917, + "Ġbuilt": 5918, + "des": 5919, + "Part": 5920, + "(re": 5921, + "Ġworth": 5922, + "hib": 5923, + "game": 5924, + "91": 5925, + "192": 5926, + "Ġв": 5927, + "acion": 5928, + "ĠWhite": 5929, + "(type": 5930, + "(`": 5931, + "81": 5932, + "Ġnatural": 5933, + "Ġinj": 5934, + "Ġcalcul": 5935, + "ĠApril": 5936, + ".List": 5937, + "Ġassociated": 5938, + "ĉSystem": 5939, + "~~": 5940, + "=[": 5941, + "Ġstorage": 5942, + "Ġbytes": 5943, + "Ġtravel": 5944, + "Ġsou": 5945, + "Ġpassed": 5946, + "!=": 5947, + "ascript": 5948, + ".open": 5949, + "Ġgrid": 5950, + "Ġbus": 5951, + "Ġrecogn": 5952, + "Ab": 5953, + "Ġhon": 5954, + "ĠCenter": 5955, + "Ġprec": 5956, + "build": 5957, + "73": 5958, + "HTML": 5959, + "ĠSan": 5960, + "Ġcountries": 5961, + "aled": 5962, + "token": 5963, + "kt": 5964, + "Ġqual": 5965, + "Last": 5966, + "adow": 5967, + "Ġmanufact": 5968, + "idad": 5969, + "jango": 5970, + "Next": 5971, + "xf": 5972, + ".a": 5973, + "Ġporno": 5974, + "ĠPM": 5975, + "erve": 5976, + "iting": 5977, + "_th": 5978, + "ci": 5979, + "=None": 5980, + "gs": 5981, + "Ġlogin": 5982, + "atives": 5983, + "']);Ċ": 5984, + "Äħ": 5985, + "Ġill": 5986, + "IA": 5987, + "children": 5988, + "DO": 5989, + "Ġlevels": 5990, + "Ġ{{": 5991, + "Ġlooks": 5992, + "Ġ\"#": 5993, + "ToString": 5994, + "Ġnecessary": 5995, + "ĠĠĠĊ": 5996, + "cell": 5997, + "Entry": 5998, + "Ġ'#": 5999, + "Ġextrem": 6000, + "Selector": 6001, + "Ġplaceholder": 6002, + "Load": 6003, + "Ġreleased": 6004, + "ORE": 6005, + "Enumer": 6006, + "ĠTV": 6007, + "SET": 6008, + "inq": 6009, + "Press": 6010, + "ĠDepartment": 6011, + "Ġproperties": 6012, + "Ġrespond": 6013, + "Search": 6014, + "ael": 6015, + "Ġrequ": 6016, + "ĠBook": 6017, + "/Ċ": 6018, + "(st": 6019, + "Ġfinancial": 6020, + "icket": 6021, + "_input": 6022, + "Ġthreat": 6023, + "(in": 6024, + "Strip": 6025, + "ìĿ": 6026, + "ção": 6027, + "71": 6028, + "Ġevidence": 6029, + "));": 6030, + "ĠBro": 6031, + "Ġ[];Ċ": 6032, + "Ġou": 6033, + "buf": 6034, + "Script": 6035, + "dat": 6036, + "Ġrule": 6037, + "#import": 6038, + "=\"/": 6039, + "Serial": 6040, + "Ġstarting": 6041, + "[index": 6042, + "ae": 6043, + "Ġcontrib": 6044, + "session": 6045, + "_new": 6046, + "utable": 6047, + "ober": 6048, + "Ġ\"./": 6049, + "Ġlogger": 6050, + "Ġrecently": 6051, + "Ġreturned": 6052, + "ččĊ": 6053, + ")))Ċ": 6054, + "itions": 6055, + "Ġseek": 6056, + "Ġcommunic": 6057, + "Ġ\".": 6058, + "Ġusername": 6059, + "ECT": 6060, + "DS": 6061, + "Ġotherwise": 6062, + "ĠGerman": 6063, + ".aw": 6064, + "Adapter": 6065, + "ixel": 6066, + "Ġsystems": 6067, + "Ġdrop": 6068, + "83": 6069, + "Ġstructure": 6070, + "Ġ$(\"#": 6071, + "encies": 6072, + "anning": 6073, + "ĠLink": 6074, + "ĠResponse": 6075, + "Ġstri": 6076, + "ż": 6077, + "ĠDB": 6078, + "æĹ": 6079, + "android": 6080, + "submit": 6081, + "otion": 6082, + "92": 6083, + "(@": 6084, + ".test": 6085, + "82": 6086, + "ĊĊĊĊĊĊĊĊ": 6087, + "];čĊ": 6088, + "Ġdirectly": 6089, + "Ġ\"%": 6090, + "ris": 6091, + "elta": 6092, + "AIL": 6093, + "){čĊ": 6094, + "mine": 6095, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 6096, + "(k": 6097, + "bon": 6098, + "asic": 6099, + "pite": 6100, + "___": 6101, + "Max": 6102, + "Ġerrors": 6103, + "ĠWhile": 6104, + "Ġarguments": 6105, + "Ġensure": 6106, + "Right": 6107, + "-based": 6108, + "Web": 6109, + "Ġ-=": 6110, + "Ġintrodu": 6111, + "ĠInst": 6112, + "ĠWash": 6113, + "ordin": 6114, + "join": 6115, + "Database": 6116, + "Ġgrad": 6117, + "Ġusually": 6118, + "ITE": 6119, + "Props": 6120, + "?>Ċ": 6121, + "ĠGo": 6122, + "@Override": 6123, + "REF": 6124, + "Ġip": 6125, + "ĠAustral": 6126, + "Ġist": 6127, + "ViewById": 6128, + "Ġserious": 6129, + "Ġcustomer": 6130, + ".prototype": 6131, + "odo": 6132, + "cor": 6133, + "Ġdoor": 6134, + "ĠWITHOUT": 6135, + "Ġplant": 6136, + "Ġbegan": 6137, + "Ġdistance": 6138, + "()).": 6139, + "Ġchance": 6140, + "Ġord": 6141, + "came": 6142, + "pragma": 6143, + "Ġprotect": 6144, + "ragment": 6145, + "ĠNode": 6146, + "ening": 6147, + "Ñĩ": 6148, + "Ġroute": 6149, + "ĠSchool": 6150, + "hi": 6151, + "Ġneighb": 6152, + "After": 6153, + "licit": 6154, + "Ġcontr": 6155, + "Ġprimary": 6156, + "AA": 6157, + ".WriteLine": 6158, + "utils": 6159, + "Ġbi": 6160, + "Red": 6161, + ".Linq": 6162, + ".object": 6163, + "Ġleaders": 6164, + "unities": 6165, + "Ġgun": 6166, + "onth": 6167, + "ĠDev": 6168, + "FILE": 6169, + "Ġcomments": 6170, + "_len": 6171, + "arrow": 6172, + "amount": 6173, + "Range": 6174, + "sert": 6175, + "GridView": 6176, + "Ġupdated": 6177, + "ĠMo": 6178, + "Ġinform": 6179, + "ociety": 6180, + "ala": 6181, + "Access": 6182, + "Ġhab": 6183, + "Ġcreat": 6184, + "_arg": 6185, + "ĠJanuary": 6186, + "ĠDay": 6187, + "\")čĊ": 6188, + "uple": 6189, + "document": 6190, + "gorith": 6191, + "menu": 6192, + "ĠOver": 6193, + "bb": 6194, + ".title": 6195, + "_out": 6196, + "Ġled": 6197, + "uri": 6198, + "Ġ?>": 6199, + "gl": 6200, + "Ġbank": 6201, + "ayment": 6202, + "ĉprintf": 6203, + "MD": 6204, + "Ġsample": 6205, + "Ġhands": 6206, + "ĠVersion": 6207, + "uario": 6208, + "Ġoffers": 6209, + "ityEngine": 6210, + "Ġshape": 6211, + "Ġsleep": 6212, + "_point": 6213, + "Settings": 6214, + "Ġachie": 6215, + "Ġsold": 6216, + "ota": 6217, + ".bind": 6218, + "Am": 6219, + "Ġsafe": 6220, + "Store": 6221, + "Ġshared": 6222, + "Ġpriv": 6223, + "_VAL": 6224, + "Ġsens": 6225, + "){": 6226, + "Ġremember": 6227, + "shared": 6228, + "element": 6229, + "Ġshoot": 6230, + "Vert": 6231, + "cout": 6232, + "Ġenv": 6233, + "_label": 6234, + "Ġ>Ċ": 6235, + "run": 6236, + "Ġscene": 6237, + "(array": 6238, + "device": 6239, + "_title": 6240, + "agon": 6241, + "]čĊ": 6242, + "aby": 6243, + "Ġbecame": 6244, + "boolean": 6245, + "Ġpark": 6246, + "ĠCode": 6247, + "upload": 6248, + "riday": 6249, + "ĠSeptember": 6250, + "Fe": 6251, + "Ġsen": 6252, + "cing": 6253, + "FL": 6254, + "Col": 6255, + "uts": 6256, + "_page": 6257, + "inn": 6258, + "Ġimplied": 6259, + "aling": 6260, + "Ġyourself": 6261, + ".Count": 6262, + "conf": 6263, + "Ġaud": 6264, + "_init": 6265, + ".)": 6266, + "Ġwrote": 6267, + "003": 6268, + "NG": 6269, + ".Error": 6270, + "ä»": 6271, + ".for": 6272, + "Ġequal": 6273, + "ĠRequest": 6274, + "Ġserial": 6275, + "Ġallows": 6276, + "XX": 6277, + "Ġmiddle": 6278, + "chor": 6279, + "195": 6280, + "94": 6281, + "ø": 6282, + "erval": 6283, + ".Column": 6284, + "reading": 6285, + "Ġescort": 6286, + "ĠAugust": 6287, + "Ġquickly": 6288, + "Ġweap": 6289, + "ĠCG": 6290, + "ropri": 6291, + "ho": 6292, + "Ġcop": 6293, + "(struct": 6294, + "ĠBig": 6295, + "Ġvs": 6296, + "Ġfrequ": 6297, + ".Value": 6298, + "Ġactions": 6299, + "Ġproper": 6300, + "Ġinn": 6301, + "Ġobjects": 6302, + "Ġmatrix": 6303, + "avascript": 6304, + "Ġones": 6305, + ".group": 6306, + "Ġgreen": 6307, + "Ġpaint": 6308, + "ools": 6309, + "ycl": 6310, + "encode": 6311, + "olt": 6312, + "comment": 6313, + ".api": 6314, + "Dir": 6315, + "Ġune": 6316, + "izont": 6317, + ".position": 6318, + "Ġdesigned": 6319, + "_val": 6320, + "avi": 6321, + "iring": 6322, + "tab": 6323, + "Ġlayer": 6324, + "Ġviews": 6325, + "Ġreve": 6326, + "rael": 6327, + "ĠON": 6328, + "rics": 6329, + "160": 6330, + "np": 6331, + "Ġcore": 6332, + "());čĊ": 6333, + "Main": 6334, + "Ġexpert": 6335, + "ĉĉčĊ": 6336, + "_en": 6337, + "Ġ/>": 6338, + "utter": 6339, + "IAL": 6340, + "ails": 6341, + "ĠKing": 6342, + "*/ĊĊ": 6343, + "ĠMet": 6344, + "_end": 6345, + "addr": 6346, + "ora": 6347, + "Ġir": 6348, + "Min": 6349, + "Ġsurpr": 6350, + "Ġrepe": 6351, + "Ġdirectory": 6352, + "PUT": 6353, + "-S": 6354, + "Ġelection": 6355, + "haps": 6356, + ".pre": 6357, + "cm": 6358, + "Values": 6359, + "Ġ\"Ċ": 6360, + "column": 6361, + "ivil": 6362, + "Login": 6363, + "inue": 6364, + "93": 6365, + "Ġbeautiful": 6366, + "Ġsecret": 6367, + "(event": 6368, + "Ġchat": 6369, + "ums": 6370, + "Ġorigin": 6371, + "Ġeffects": 6372, + "Ġmanagement": 6373, + "illa": 6374, + "tk": 6375, + "Ġsetting": 6376, + "ĠCour": 6377, + "Ġmassage": 6378, + "ĉend": 6379, + "Ġhappy": 6380, + "Ġfinish": 6381, + "Ġcamera": 6382, + "ĠVer": 6383, + "ĠDemocr": 6384, + "ĠHer": 6385, + "(Q": 6386, + "cons": 6387, + "ita": 6388, + "Ġ'.": 6389, + "{}": 6390, + "ĉC": 6391, + "Ġstuff": 6392, + "194": 6393, + "Ġ:Ċ": 6394, + "ĠAR": 6395, + "Task": 6396, + "hidden": 6397, + "eros": 6398, + "IGN": 6399, + "atio": 6400, + "ĠHealth": 6401, + "olute": 6402, + "Enter": 6403, + "'>": 6404, + "ĠTwitter": 6405, + "ĠCounty": 6406, + "scribe": 6407, + "Ġ=>Ċ": 6408, + "Ġhy": 6409, + "fit": 6410, + "Ġmilitary": 6411, + "Ġsale": 6412, + "required": 6413, + "non": 6414, + "bootstrap": 6415, + "hold": 6416, + "rim": 6417, + "-old": 6418, + "ĠDown": 6419, + "Ġmention": 6420, + "contact": 6421, + "_group": 6422, + "oday": 6423, + "Ġtown": 6424, + "Ġsolution": 6425, + "uate": 6426, + "elling": 6427, + "]->": 6428, + "otes": 6429, + "ental": 6430, + "omen": 6431, + "ospital": 6432, + "ĠSup": 6433, + "_EN": 6434, + "Ġslow": 6435, + "SESSION": 6436, + "Ġblue": 6437, + "ago": 6438, + "Ġlives": 6439, + "Ġ^": 6440, + ".un": 6441, + "inst": 6442, + "enge": 6443, + "Ġcustomers": 6444, + "Ġcast": 6445, + "udget": 6446, + "ï¼ģ": 6447, + "icens": 6448, + "Ġdetermin": 6449, + "Selected": 6450, + "_pl": 6451, + "ueue": 6452, + "Ġdark": 6453, + "//ĊĊ": 6454, + "si": 6455, + "thern": 6456, + "ĠJapan": 6457, + "/w": 6458, + "PU": 6459, + "ĠEast": 6460, + "ovie": 6461, + "Ġpackage": 6462, + "Ġnor": 6463, + "Ġapi": 6464, + "bot": 6465, + "\"];Ċ": 6466, + "_post": 6467, + "ulate": 6468, + "Ġclub": 6469, + "'));Ċ": 6470, + "Ġloop": 6471, + "PIO": 6472, + "ione": 6473, + "shot": 6474, + "Initial": 6475, + "Ġplayed": 6476, + "register": 6477, + "rought": 6478, + "_max": 6479, + "acement": 6480, + "match": 6481, + "raphics": 6482, + "AST": 6483, + "Ġexisting": 6484, + "Ġcomplex": 6485, + "DA": 6486, + ".Ch": 6487, + ".common": 6488, + "mo": 6489, + "Ġ'../../": 6490, + "ito": 6491, + "Ġanalysis": 6492, + "Ġdeliver": 6493, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 6494, + "idx": 6495, + "Ãł": 6496, + "ongo": 6497, + "ĠEnglish": 6498, + "Ċ": 10197, + "_default": 10198, + "ĠDatabase": 10199, + "rep": 10200, + "ESS": 10201, + "nergy": 10202, + ".Find": 10203, + "_mask": 10204, + "Ġrise": 10205, + "Ġkernel": 10206, + "::$": 10207, + ".Q": 10208, + "Ġoffering": 10209, + "decl": 10210, + "ĠCS": 10211, + "Ġlisted": 10212, + "Ġmostly": 10213, + "enger": 10214, + "Ġblocks": 10215, + "olo": 10216, + "Ġgoverning": 10217, + "\\F": 10218, + "Ġconcent": 10219, + ".getText": 10220, + "Ġmb": 10221, + "Ġoccurred": 10222, + "Ġchanging": 10223, + "Scene": 10224, + "_CODE": 10225, + "Beh": 10226, + "\"The": 10227, + "Ġtile": 10228, + "ĠAssociation": 10229, + "ĉP": 10230, + "alty": 10231, + "_ad": 10232, + "odies": 10233, + "iated": 10234, + "Ġprepared": 10235, + "possible": 10236, + "Ġmort": 10237, + "TEST": 10238, + "142": 10239, + "Ġignore": 10240, + "Ġcalc": 10241, + "Ġrs": 10242, + "ĠassertEquals": 10243, + "Ġsz": 10244, + "ĠTHIS": 10245, + ".\"Ċ": 10246, + "Ġcanvas": 10247, + "java": 10248, + "Ġdut": 10249, + "VALID": 10250, + ".sql": 10251, + ".input": 10252, + "Ġaux": 10253, + "Sup": 10254, + "Ġartist": 10255, + "Vec": 10256, + "_TIME": 10257, + ".stringify": 10258, + "etween": 10259, + "ĠCategory": 10260, + "Ġ[-": 10261, + "ĠDevExpress": 10262, + "ĠJul": 10263, + "Ġring": 10264, + ".ed": 10265, + "YY": 10266, + "Let": 10267, + "TextField": 10268, + "Ġflat": 10269, + "_print": 10270, + "ĠOTHER": 10271, + "adian": 10272, + "Ġchecked": 10273, + "ele": 10274, + "Align": 10275, + "standing": 10276, + "Ġ[],": 10277, + "Ġlab": 10278, + "ucky": 10279, + "ĠChristmas": 10280, + "(image": 10281, + ".module": 10282, + "Ġlots": 10283, + "Ġslightly": 10284, + "(final": 10285, + "erge": 10286, + "è¿": 10287, + "147": 10288, + "ĠPolice": 10289, + "143": 10290, + "ĠRight": 10291, + "Ġaward": 10292, + "ĠOS": 10293, + "Ġ{}ĊĊ": 10294, + "Ġptr": 10295, + "oves": 10296, + "icated": 10297, + "ем": 10298, + "Ġmanage": 10299, + "oliday": 10300, + "Amount": 10301, + "oolStrip": 10302, + "tbody": 10303, + "Nav": 10304, + "wrap": 10305, + "BB": 10306, + "Ġwatching": 10307, + "arios": 10308, + "Ġoptional": 10309, + "_K": 10310, + "ĠLicensed": 10311, + ".Map": 10312, + "Timer": 10313, + "ĠAP": 10314, + "ĠRev": 10315, + "(o": 10316, + ",c": 10317, + "umin": 10318, + "etailed": 10319, + "ĠHy": 10320, + "Ġblank": 10321, + "agger": 10322, + "ĠSelf": 10323, + "()[": 10324, + ".make": 10325, + "earn": 10326, + "channel": 10327, + ";Ċ": 10342, + "World": 10343, + "Ġpython": 10344, + "Ġlif": 10345, + "Ġtrav": 10346, + "Ġconven": 10347, + "company": 10348, + "ĠClub": 10349, + "138": 10350, + "Ver": 10351, + "Btn": 10352, + "Ġzone": 10353, + "products": 10354, + "ĠEduc": 10355, + "Ġverify": 10356, + "ĠMil": 10357, + "ono": 10358, + "]);ĊĊ": 10359, + "ENCE": 10360, + "Ġpacket": 10361, + "Ġcer": 10362, + "Ġenumer": 10363, + "Ġpars": 10364, + "formed": 10365, + "Ġoccup": 10366, + "tre": 10367, + "Ġexercise": 10368, + "Day": 10369, + "_sum": 10370, + "Ġasking": 10371, + "aption": 10372, + "Ġorders": 10373, + "Ġspending": 10374, + "ĠERR": 10375, + ".Dis": 10376, + "ĠUtil": 10377, + "âĢľI": 10378, + "\\'": 10379, + "?)": 10380, + "/>Ċ": 10381, + "Ġemot": 10382, + "Ġinfluence": 10383, + "ĠAfrica": 10384, + "atters": 10385, + "Ùħ": 10386, + ".session": 10387, + "Ġchief": 10388, + "ĉĉĉĉĉĉĉĉĉĉĉ": 10389, + "Ġtom": 10390, + "cluded": 10391, + "serial": 10392, + "_handler": 10393, + ".Type": 10394, + "aped": 10395, + "Ġpolicies": 10396, + "-ex": 10397, + "-tr": 10398, + "blank": 10399, + "merce": 10400, + "Ġcoverage": 10401, + "Ġrc": 10402, + "_matrix": 10403, + "_box": 10404, + "Ġcharges": 10405, + "ĠBoston": 10406, + "Pe": 10407, + "Ġcircum": 10408, + "Ġfilled": 10409, + "148": 10410, + "Ġnorth": 10411, + "ictureBox": 10412, + "ĉres": 10413, + "è®": 10414, + "Ġtermin": 10415, + "Ġ[âĢ¦": 10416, + "IRECT": 10417, + "Ġber": 10418, + "Ġ\"../../": 10419, + "retch": 10420, + ".code": 10421, + "_col": 10422, + "ĠGovernment": 10423, + "Ġargv": 10424, + "ĠLord": 10425, + "asi": 10426, + "Exec": 10427, + "ĉlet": 10428, + "vertis": 10429, + "Ġdiscussion": 10430, + "enance": 10431, + "outube": 10432, + "typeof": 10433, + "Ġserved": 10434, + "ĠPut": 10435, + "ĉx": 10436, + "Ġsweet": 10437, + "Before": 10438, + "ategy": 10439, + ".of": 10440, + "ĠMaterial": 10441, + "Sort": 10442, + "ONT": 10443, + "igital": 10444, + "Why": 10445, + "Ġsust": 10446, + "Ġç": 10447, + "abet": 10448, + "Ġsegment": 10449, + "Ġ[],Ċ": 10450, + "ĠMuslim": 10451, + "ĠfindViewById": 10452, + "cut": 10453, + "_TEXT": 10454, + "ĠMary": 10455, + "Ġloved": 10456, + "Ġlie": 10457, + "ĠJO": 10458, + "Ġisset": 10459, + "month": 10460, + "Ġprime": 10461, + "ti": 10462, + "ĠCarol": 10463, + "Use": 10464, + "146": 10465, + "ĠPop": 10466, + "ĠSave": 10467, + "Interval": 10468, + "execute": 10469, + "dy": 10470, + "ĠIran": 10471, + "_cont": 10472, + "ĉT": 10473, + "Ġphase": 10474, + "checkbox": 10475, + "week": 10476, + "Ġhide": 10477, + "Ġtil": 10478, + "Ġju": 10479, + "Custom": 10480, + "burg": 10481, + "/M": 10482, + "TON": 10483, + "Ġquant": 10484, + "Ġrub": 10485, + "ixels": 10486, + "Ġinstalled": 10487, + "Ġdump": 10488, + "Ġproperly": 10489, + "(List": 10490, + "Ġdecide": 10491, + "apply": 10492, + "Has": 10493, + "Ġkeeping": 10494, + "Ġcitizens": 10495, + "Ġjoint": 10496, + "pool": 10497, + "Socket": 10498, + "_op": 10499, + "Ġweapon": 10500, + "gnore": 10501, + "ĠExec": 10502, + "otten": 10503, + "ĠMS": 10504, + "Ġ(-": 10505, + "ĠReview": 10506, + "Ġexamples": 10507, + "Ġtight": 10508, + "!(": 10509, + "DP": 10510, + "ĠMessageBox": 10511, + "Ġphotograph": 10512, + "164": 10513, + "URI": 10514, + "ét": 10515, + "low": 10516, + "ĠGrand": 10517, + ".persistence": 10518, + "Ġmaintain": 10519, + "Ġnums": 10520, + "Ġzip": 10521, + "ials": 10522, + "ĠGets": 10523, + "peg": 10524, + "ĠBuffer": 10525, + "~~~~": 10526, + "rastructure": 10527, + "ĠPL": 10528, + "uen": 10529, + "obby": 10530, + "sizeof": 10531, + "Ġpic": 10532, + "Ġseed": 10533, + "Ġexperienced": 10534, + "Ġodd": 10535, + "Ġkick": 10536, + "Ġprocedure": 10537, + "avigator": 10538, + "-on": 10539, + ",j": 10540, + "ĠAlthough": 10541, + "ĠuserId": 10542, + "accept": 10543, + "Blue": 10544, + "IColor": 10545, + "layer": 10546, + "available": 10547, + "Ġends": 10548, + ".table": 10549, + "Ġdataset": 10550, + "bus": 10551, + "Ġexplain": 10552, + "(pro": 10553, + "ĠCommittee": 10554, + "Ġnoted": 10555, + "]:Ċ": 10556, + "Dim": 10557, + "stdio": 10558, + "154": 10559, + ".\",Ċ": 10560, + "_source": 10561, + "181": 10562, + "ĠWeek": 10563, + "ĠEdge": 10564, + "Ġoperating": 10565, + "Ġeste": 10566, + "ipl": 10567, + "330": 10568, + "agination": 10569, + "Ġproceed": 10570, + "Ġanimation": 10571, + ".Models": 10572, + "ĠWatch": 10573, + "iat": 10574, + "Ġoppon": 10575, + "/A": 10576, + "Report": 10577, + "Ġsounds": 10578, + "_buf": 10579, + "IELD": 10580, + "Ġbund": 10581, + "ĉget": 10582, + ".pr": 10583, + "(tmp": 10584, + "Ġkid": 10585, + ">ĊĊĊ": 10586, + "Ġyang": 10587, + "NotFound": 10588, + "ÑĨ": 10589, + "math": 10590, + "@gmail": 10591, + "ĠLIMIT": 10592, + "redients": 10593, + "Ġvent": 10594, + "avigate": 10595, + "Look": 10596, + "Ġreligious": 10597, + "Ġrand": 10598, + "rio": 10599, + "(GL": 10600, + "_ip": 10601, + "uan": 10602, + "iciency": 10603, + "ĠChange": 10604, + ">čĊčĊ": 10605, + "ĠEntity": 10606, + "Ġrencontre": 10607, + "ĠRet": 10608, + "plan": 10609, + "én": 10610, + "BOOL": 10611, + "uries": 10612, + "train": 10613, + "Definition": 10614, + "============": 10615, + "zz": 10616, + "450": 10617, + "Animation": 10618, + "ĠOK": 10619, + "_menu": 10620, + ".bl": 10621, + "_score": 10622, + "Ġacad": 10623, + "(System": 10624, + "Ġrefresh": 10625, + "'=>$": 10626, + ".Graphics": 10627, + "amento": 10628, + "pid": 10629, + "tc": 10630, + "Ġtips": 10631, + "Ġhomes": 10632, + "Ġfuel": 10633, + "âĸ": 10634, + "_helper": 10635, + "ĠĠčĊ": 10636, + "ĠRoom": 10637, + ".Close": 10638, + "_attr": 10639, + "ĠMount": 10640, + "ĠEv": 10641, + "arser": 10642, + "_top": 10643, + "eah": 10644, + "ĠDelete": 10645, + "ãĢį": 10646, + "uke": 10647, + "Ġusage": 10648, + "aria": 10649, + "_dev": 10650, + "Ġtexture": 10651, + "Ġconversation": 10652, + "eper": 10653, + "Bean": 10654, + "done": 10655, + "nonatomic": 10656, + "ĠSecond": 10657, + "Ġshooting": 10658, + "_pre": 10659, + "Components": 10660, + "Ġ]ĊĊ": 10661, + "__,": 10662, + "stitution": 10663, + ".Char": 10664, + ">();ĊĊ": 10665, + "Ġpresented": 10666, + "Ġwa": 10667, + "oker": 10668, + "-ĊĊ": 10669, + "iner": 10670, + "Ġbecoming": 10671, + "Ġincident": 10672, + "Att": 10673, + "162": 10674, + "Ġrevealed": 10675, + "forc": 10676, + "Ġboot": 10677, + ".page": 10678, + "Enumerator": 10679, + "165": 10680, + "_->": 10681, + "Photo": 10682, + "Ġspring": 10683, + ".\",": 10684, + "ĠDictionary": 10685, + "BJECT": 10686, + "Ġlocations": 10687, + "Ġsamples": 10688, + "InputStream": 10689, + "ĠBrown": 10690, + "Ġstats": 10691, + "quality": 10692, + "Ñħ": 10693, + "-dis": 10694, + "Ġhelping": 10695, + "Ġped": 10696, + "224": 10697, + "(se": 10698, + "ĠWho": 10699, + "alian": 10700, + "internal": 10701, + "Ġft": 10702, + ">().": 10703, + "->{": 10704, + "Ġmine": 10705, + "Ġsector": 10706, + "Ġgro": 10707, + "Ġopportunities": 10708, + "Ġü": 10709, + "Ġmp": 10710, + "Ġalleged": 10711, + "Ġdoubt": 10712, + "Mouse": 10713, + "About": 10714, + "_part": 10715, + "Ġchair": 10716, + "Ġstopped": 10717, + "161": 10718, + "loop": 10719, + "entities": 10720, + "Ġapps": 10721, + "ansion": 10722, + "Ġmental": 10723, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10724, + "FR": 10725, + "Ġdefend": 10726, + "care": 10727, + "Ġideal": 10728, + "/api": 10729, + "urface": 10730, + "011": 10731, + "Ġele": 10732, + "ulator": 10733, + "ĠRights": 10734, + "anguages": 10735, + "Ġfunds": 10736, + "Ġadapt": 10737, + "Attributes": 10738, + "Ġdeploy": 10739, + "opts": 10740, + "Ġvalidation": 10741, + "Ġconcerns": 10742, + "uce": 10743, + ".num": 10744, + "ulture": 10745, + "ila": 10746, + "Ġcup": 10747, + "Ġpure": 10748, + ".Fore": 10749, + "183": 10750, + "ĠHashMap": 10751, + ".valueOf": 10752, + "asm": 10753, + "MO": 10754, + "Ġcs": 10755, + "Ġstores": 10756, + "Ġ************************************************************************": 10757, + "Ġcommunication": 10758, + "mem": 10759, + ".EventHandler": 10760, + ".Status": 10761, + "_right": 10762, + ".setOn": 10763, + "Sheet": 10764, + "Ġidentify": 10765, + "enerated": 10766, + "ordered": 10767, + "Ġ\"[": 10768, + "Ġswe": 10769, + "Condition": 10770, + "ĠAccording": 10771, + "Ġprepare": 10772, + "Ġrob": 10773, + "Pool": 10774, + "Ġsport": 10775, + "rv": 10776, + "ĠRouter": 10777, + "Ġalternative": 10778, + "([]": 10779, + "ĠChicago": 10780, + "ipher": 10781, + "ische": 10782, + "ĠDirector": 10783, + "kl": 10784, + "ĠWil": 10785, + "keys": 10786, + "Ġmysql": 10787, + "Ġwelcome": 10788, + "king": 10789, + "ĠManager": 10790, + "Ġcaught": 10791, + ")}Ċ": 10792, + "Score": 10793, + "_PR": 10794, + "Ġsurvey": 10795, + "hab": 10796, + "Headers": 10797, + "ADER": 10798, + "Ġdecor": 10799, + "Ġturns": 10800, + "Ġradius": 10801, + "errupt": 10802, + "Cor": 10803, + "Ġmel": 10804, + "Ġintr": 10805, + "(q": 10806, + "ĠAC": 10807, + "amos": 10808, + "MAX": 10809, + "ĠGrid": 10810, + "ĠJesus": 10811, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10812, + ".DE": 10813, + "Ġts": 10814, + "Ġlinked": 10815, + "free": 10816, + "ĠQt": 10817, + "Ġ/**čĊ": 10818, + "Ġfaster": 10819, + "ctr": 10820, + "_J": 10821, + "DT": 10822, + ".Check": 10823, + "Ġcombination": 10824, + "Ġintended": 10825, + "-the": 10826, + "-type": 10827, + "182": 10828, + "ectors": 10829, + "ami": 10830, + "uting": 10831, + "Ġuma": 10832, + "XML": 10833, + "UCT": 10834, + "Ap": 10835, + "ĠRandom": 10836, + "Ġran": 10837, + ".sort": 10838, + "Ġsorted": 10839, + ".Un": 10840, + "401": 10841, + "_PER": 10842, + "itory": 10843, + "Ġpriority": 10844, + "ĠGal": 10845, + "ĠOld": 10846, + "hot": 10847, + "ĠDisplay": 10848, + "(sub": 10849, + "_TH": 10850, + "_Y": 10851, + "ĠCare": 10852, + "loading": 10853, + "Kind": 10854, + "_handle": 10855, + ",,": 10856, + "rase": 10857, + "_replace": 10858, + ".addEventListener": 10859, + "ĠRT": 10860, + "172": 10861, + "Ġentered": 10862, + "gers": 10863, + "Ġich": 10864, + "(start": 10865, + "205": 10866, + "/app": 10867, + "Ġbrother": 10868, + "Memory": 10869, + "Outlet": 10870, + "Ġutf": 10871, + "prec": 10872, + "Ġnavigation": 10873, + "ORK": 10874, + "Ġdst": 10875, + "Detail": 10876, + "Ġaudience": 10877, + "Ġdur": 10878, + "Ġcluster": 10879, + "unched": 10880, + "Ġ],": 10881, + "Ġcomfortable": 10882, + ".values": 10883, + "ĠTotal": 10884, + "Ġsnap": 10885, + "Ġstandards": 10886, + "Ġperformed": 10887, + "hand": 10888, + "(\"@": 10889, + "åŃ": 10890, + "Ġphil": 10891, + "ibr": 10892, + "trim": 10893, + "Ġforget": 10894, + "157": 10895, + "Ġdoctor": 10896, + ".TextBox": 10897, + "377": 10898, + "icons": 10899, + ",s": 10900, + "ĠOp": 10901, + "Sm": 10902, + "Stop": 10903, + "ĉList": 10904, + "ĉu": 10905, + "Comment": 10906, + "_VERSION": 10907, + ".Xtra": 10908, + "Person": 10909, + "rb": 10910, + "LOB": 10911, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 10912, + "ĠCentral": 10913, + "270": 10914, + "ICK": 10915, + "raq": 10916, + "Ġputting": 10917, + "Ġmd": 10918, + "ĠLove": 10919, + "Program": 10920, + "Border": 10921, + "oor": 10922, + "Ġallowing": 10923, + "after": 10924, + "Ġentries": 10925, + "ĠMaybe": 10926, + "]).": 10927, + "ĠShort": 10928, + ")\\": 10929, + ".now": 10930, + "friend": 10931, + "Ġprefer": 10932, + "ĠGPIO": 10933, + "osis": 10934, + "ĠGameObject": 10935, + "Ġskip": 10936, + "Ġcompetition": 10937, + "_match": 10938, + "lications": 10939, + "_CONT": 10940, + ".groupBox": 10941, + "Ġals": 10942, + "666": 10943, + "\"We": 10944, + "_eq": 10945, + "lan": 10946, + "_search": 10947, + "ĠMusic": 10948, + "asis": 10949, + "Ġbind": 10950, + "ĠIsland": 10951, + "rum": 10952, + "(E": 10953, + "Ġseat": 10954, + "Video": 10955, + "Ġack": 10956, + "reek": 10957, + "={()": 10958, + "Ġrating": 10959, + "Ġrestaurant": 10960, + "456": 10961, + "DEX": 10962, + "(buf": 10963, + "pping": 10964, + "uality": 10965, + "Ġleague": 10966, + "176": 10967, + "Ġfocused": 10968, + "apon": 10969, + "$data": 10970, + "CLUD": 10971, + "CLUDING": 10972, + "Ġabsolute": 10973, + "(query": 10974, + "Ġtells": 10975, + "Ang": 10976, + "Ġcommunities": 10977, + "Ġhonest": 10978, + "oking": 10979, + "Ġapart": 10980, + "arity": 10981, + "/$": 10982, + "_module": 10983, + "ĠEnc": 10984, + ".an": 10985, + ".Config": 10986, + "Cre": 10987, + "Ġshock": 10988, + "ĠArab": 10989, + "IENT": 10990, + "/re": 10991, + "Ġretrie": 10992, + "ycler": 10993, + "isa": 10994, + "ĠOrgan": 10995, + ".graph": 10996, + "Ġí": 10997, + "ĠBAS": 10998, + "Enum": 10999, + "Ġpossibly": 11000, + "ÑĢаÐ": 11001, + "ĠJapanese": 11002, + "Ġcraft": 11003, + "ĠPlace": 11004, + "Ġtalent": 11005, + "Ġfunding": 11006, + "Ġconfirmed": 11007, + "Ġcycle": 11008, + "/x": 11009, + "GE": 11010, + "Ġhearing": 11011, + "Ġplants": 11012, + "Ġmouth": 11013, + "pages": 11014, + "oria": 11015, + "ĠRemove": 11016, + "_total": 11017, + "Ġod": 11018, + "ollapse": 11019, + "door": 11020, + "Ġbought": 11021, + "Ġaddr": 11022, + "ARCH": 11023, + "_dim": 11024, + "dden": 11025, + "Ġdecades": 11026, + "REQUEST": 11027, + "Ġversions": 11028, + "fire": 11029, + "006": 11030, + "Ġmoves": 11031, + "fb": 11032, + "Ġcoffee": 11033, + ".connect": 11034, + "ĠRow": 11035, + "Ġschema": 11036, + "Scope": 11037, + "-Type": 11038, + "Ġfighting": 11039, + "Ġretail": 11040, + "Ġmodified": 11041, + "TF": 11042, + "Files": 11043, + "nie": 11044, + "_command": 11045, + "stone": 11046, + "ĠÑĤ": 11047, + "_thread": 11048, + "Ġbond": 11049, + "ĠDevelopment": 11050, + "Ġpt": 11051, + "FORM": 11052, + "plet": 11053, + "Ġidentified": 11054, + "cpp": 11055, + "206": 11056, + "225": 11057, + "Ġcoding": 11058, + "oked": 11059, + "ĠMaster": 11060, + "IDTH": 11061, + "Ġresidents": 11062, + "redit": 11063, + "ĠPhoto": 11064, + "=-": 11065, + "unte": 11066, + "ateur": 11067, + "159": 11068, + "_STATE": 11069, + "ĠSing": 11070, + "Ġsheet": 11071, + ".val": 11072, + "orse": 11073, + "Ġhers": 11074, + "Ġdetermined": 11075, + "Common": 11076, + "Ġwed": 11077, + "_queue": 11078, + "PH": 11079, + "ĠAtl": 11080, + "cred": 11081, + "/LICENSE": 11082, + "Ġmes": 11083, + "Ġadvanced": 11084, + ".java": 11085, + ".Sh": 11086, + "Go": 11087, + "kill": 11088, + "fp": 11089, + "_settings": 11090, + "Ġpal": 11091, + "Ġtruck": 11092, + "Ġcombined": 11093, + "Ġ\"${": 11094, + "ĠCorpor": 11095, + "Ġjoined": 11096, + "ĠJose": 11097, + "ĠCup": 11098, + "uns": 11099, + "estival": 11100, + "levision": 11101, + "Ġbroken": 11102, + "Ġmarriage": 11103, + "ĠWestern": 11104, + "Ġrepresents": 11105, + "ĠTitle": 11106, + "Ġss": 11107, + ".Ass": 11108, + "ongoose": 11109, + "iento": 11110, + "<>();Ċ": 11111, + "Ġabsolutely": 11112, + "Ġsmooth": 11113, + "TERN": 11114, + "ĠUnless": 11115, + "Word": 11116, + "Ġmerge": 11117, + "igan": 11118, + "ĠVol": 11119, + "Ġnn": 11120, + ".getId": 11121, + "Ġз": 11122, + "171": 11123, + "Ġsexy": 11124, + "Ġseeking": 11125, + "Single": 11126, + ".this": 11127, + "179": 11128, + "Ġkom": 11129, + "bound": 11130, + ";\"": 11131, + "ĠfontSize": 11132, + "_df": 11133, + "Ġinjury": 11134, + "(H": 11135, + "Ġissued": 11136, + "_END": 11137, + ":self": 11138, + "020": 11139, + "Ġpatch": 11140, + "Ġleaves": 11141, + "Ġadopt": 11142, + "FileName": 11143, + "ãĢIJ": 11144, + "Ġexecutive": 11145, + "ĠByte": 11146, + "]))Ċ": 11147, + "Ġnu": 11148, + "outing": 11149, + "cluding": 11150, + "-R": 11151, + ".options": 11152, + "Ġsubstant": 11153, + "avax": 11154, + "ĠBUT": 11155, + "Ġtechnical": 11156, + "Ġtwice": 11157, + "Ġmás": 11158, + "Ġunivers": 11159, + "yr": 11160, + "Ġdrag": 11161, + "ĠDC": 11162, + "Ġsed": 11163, + "Ġbot": 11164, + "ĠPal": 11165, + "ĠHall": 11166, + "forcement": 11167, + "Ġauch": 11168, + ".mod": 11169, + "notation": 11170, + "_files": 11171, + ".line": 11172, + "_flag": 11173, + "[name": 11174, + "Ġresolution": 11175, + "Ġbott": 11176, + "(\"[": 11177, + "ende": 11178, + "(arr": 11179, + "Free": 11180, + "(@\"": 11181, + "ĠDistrict": 11182, + "PEC": 11183, + ":-": 11184, + "Picker": 11185, + "ĠJo": 11186, + "ĠĠĠĠĠĊ": 11187, + "ĠRiver": 11188, + "_rows": 11189, + "Ġhelpful": 11190, + "Ġmassive": 11191, + "---Ċ": 11192, + "Ġmeasures": 11193, + "007": 11194, + "ĠRuntime": 11195, + "Ġworry": 11196, + "ĠSpec": 11197, + "ĉD": 11198, + "ãĢij": 11199, + "Ġ){Ċ": 11200, + "Ġworse": 11201, + "(filename": 11202, + "Ġlay": 11203, + "Ġmagic": 11204, + "ĠTheir": 11205, + "oul": 11206, + "stroy": 11207, + "ĠWhere": 11208, + "280": 11209, + "Ġsudden": 11210, + "Ġdefe": 11211, + "Ġbinding": 11212, + "Ġflight": 11213, + "ĠOnInit": 11214, + "ĠWomen": 11215, + "ĠPolicy": 11216, + "Ġdrugs": 11217, + "ishing": 11218, + "('../": 11219, + "ĠMel": 11220, + "peat": 11221, + "tor": 11222, + "Ġproposed": 11223, + "Ġstated": 11224, + "_RES": 11225, + "Ġeast": 11226, + "212": 11227, + "ĠCONDITION": 11228, + "_desc": 11229, + "Ġwinning": 11230, + "folio": 11231, + "Mapper": 11232, + "ĠPan": 11233, + "ĠAnge": 11234, + ".servlet": 11235, + "Ġcopies": 11236, + "LM": 11237, + "Ġvm": 11238, + "åį": 11239, + "Ġdictionary": 11240, + "Seg": 11241, + "177": 11242, + "elines": 11243, + "ĠSend": 11244, + "Ġiron": 11245, + "ĠFort": 11246, + "166": 11247, + ".domain": 11248, + "Ġdebate": 11249, + "NotNull": 11250, + "eq": 11251, + "acher": 11252, + "lf": 11253, + "ĉfmt": 11254, + "Ġlawy": 11255, + "178": 11256, + "ÄŁ": 11257, + "ĠMen": 11258, + "Ġtrim": 11259, + "(NULL": 11260, + "Ġ!!": 11261, + "Ġpad": 11262, + "Ġfollows": 11263, + "\"][\"": 11264, + "requ": 11265, + "ĠEp": 11266, + ".github": 11267, + "(img": 11268, + "eto": 11269, + "('\\": 11270, + "Services": 11271, + "umbnail": 11272, + "_main": 11273, + "pleted": 11274, + "fortunately": 11275, + "Ġwindows": 11276, + "Ġplane": 11277, + "ĠConnection": 11278, + ".local": 11279, + "uard": 11280, + "}\\": 11281, + "==\"": 11282, + "andon": 11283, + "ĠRoy": 11284, + "west": 11285, + "158": 11286, + "iginal": 11287, + "emies": 11288, + "itz": 11289, + "'):Ċ": 11290, + "ĠPeter": 11291, + "Ġtough": 11292, + "Ġreduced": 11293, + "Ġcalculate": 11294, + "Ġrapid": 11295, + "customer": 11296, + "Ġefficient": 11297, + "Ġmedium": 11298, + "Ġfell": 11299, + ".ref": 11300, + "ĠCas": 11301, + "Ġfeedback": 11302, + "Speed": 11303, + "(output": 11304, + "aje": 11305, + "Ġcategories": 11306, + "Ġfee": 11307, + "};": 11308, + "Ġdeleted": 11309, + "reh": 11310, + "Ġproof": 11311, + "Desc": 11312, + "Build": 11313, + "Ġsides": 11314, + ".ArrayList": 11315, + "-%": 11316, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 11317, + "ر": 11318, + ".match": 11319, + "ли": 11320, + "Ġfeels": 11321, + "Ġachieve": 11322, + "Ġclim": 11323, + "_ON": 11324, + "ĠCD": 11325, + "Ġteacher": 11326, + "_current": 11327, + "bn": 11328, + "_PL": 11329, + "isting": 11330, + "Enable": 11331, + "GEN": 11332, + "Ġtv": 11333, + "Ġsock": 11334, + "Ġplays": 11335, + "Ġdiscount": 11336, + "ĠKE": 11337, + "ĠDebug": 11338, + "Fore": 11339, + "ĠIraq": 11340, + "Ġappearance": 11341, + "Mon": 11342, + "Ġstyled": 11343, + "ĠHuman": 11344, + "iot": 11345, + "ĠHistory": 11346, + "Ġsac": 11347, + "ĠCollection": 11348, + "Ġrecommended": 11349, + ".Selected": 11350, + "Ġorganizations": 11351, + "Ġdiscovered": 11352, + "cohol": 11353, + "adas": 11354, + "ĠThomas": 11355, + "May": 11356, + "Ġconserv": 11357, + "Ġdomin": 11358, + "ĠFollow": 11359, + "ĠSection": 11360, + "ĠThanks": 11361, + "Username": 11362, + "Ġrecipe": 11363, + "Ġwonderful": 11364, + ".sleep": 11365, + "_if": 11366, + "ĉĊĉĊ": 11367, + "orno": 11368, + "Ġru": 11369, + "_target": 11370, + ".\"\"": 11371, + "à¦": 11372, + "EventArgs": 11373, + "Ġinputs": 11374, + "Ġfif": 11375, + "Ġvision": 11376, + "cy": 11377, + "ĠSeries": 11378, + ")(((": 11379, + "Ġtrading": 11380, + "Ġmarker": 11381, + "Begin": 11382, + "Ġtypically": 11383, + "Ġcauses": 11384, + "dropdown": 11385, + "_DEBUG": 11386, + "260": 11387, + "Ġdetect": 11388, + "country": 11389, + "!\");Ċ": 11390, + "ĉR": 11391, + "appy": 11392, + "Ġcref": 11393, + "('<": 11394, + "\"=>": 11395, + "ĠLE": 11396, + "reader": 11397, + "Ġadministr": 11398, + "õ": 11399, + "ucket": 11400, + "Ġfashion": 11401, + ".char": 11402, + "izar": 11403, + "Ġdisable": 11404, + "Ġsuc": 11405, + "ĠLive": 11406, + "issue": 11407, + "Ġmetadata": 11408, + "flags": 11409, + "ĠðŁ": 11410, + "Ġcommitted": 11411, + "Ġva": 11412, + "Ġrough": 11413, + "Ġ'''Ċ": 11414, + "Ġhighlight": 11415, + "_vars": 11416, + "VO": 11417, + "Ġencoding": 11418, + "-Z": 11419, + "_sign": 11420, + "$(\"#": 11421, + "Ġrain": 11422, + "reatest": 11423, + "ĠEND": 11424, + "Selection": 11425, + "Ġcandidates": 11426, + "Ġsav": 11427, + ".Empty": 11428, + "Ġdecisions": 11429, + "Ġcollabor": 11430, + "ridge": 11431, + "feed": 11432, + "ression": 11433, + "Ġpersons": 11434, + "VM": 11435, + "008": 11436, + "ega": 11437, + "_BIT": 11438, + "According": 11439, + "acked": 11440, + "Ġdollars": 11441, + "_loss": 11442, + "ĠCost": 11443, + "}\"Ċ": 11444, + "Notification": 11445, + "Ġprostit": 11446, + "Ġauthority": 11447, + ".rec": 11448, + "Ġspokes": 11449, + "ĠToday": 11450, + "istant": 11451, + "ĠHead": 11452, + "âĢĿ.": 11453, + "ertainment": 11454, + "cean": 11455, + "culate": 11456, + "Ġven": 11457, + "However": 11458, + "_arr": 11459, + "Ġtokens": 11460, + "Graph": 11461, + "ĠJud": 11462, + "ĠVirgin": 11463, + "ĠSerial": 11464, + "unning": 11465, + "Mutable": 11466, + "agers": 11467, + ".csv": 11468, + "Ġdeveloping": 11469, + "Ġinstructions": 11470, + "Ġpromise": 11471, + "Ġrequested": 11472, + "_encode": 11473, + "/\"": 11474, + "ĠIcon": 11475, + "uilt": 11476, + "-day": 11477, + "Ġintelligence": 11478, + ".IS": 11479, + "ĠObservable": 11480, + "ĠHard": 11481, + "Bool": 11482, + "211": 11483, + "idential": 11484, + ".Anchor": 11485, + "Ġselling": 11486, + "CI": 11487, + "AGES": 11488, + "tle": 11489, + "bur": 11490, + "UFFER": 11491, + "RY": 11492, + "Ġbigger": 11493, + "Ġrat": 11494, + "Ġfamous": 11495, + "Ġtypename": 11496, + "Ġexplained": 11497, + "}}Ċ": 11498, + "Ġnuclear": 11499, + "-N": 11500, + "Ġcrisis": 11501, + "ĠEnter": 11502, + "Ġanswers": 11503, + "/${": 11504, + "/pl": 11505, + "Ġsequ": 11506, + "_next": 11507, + "mask": 11508, + "Ġstanding": 11509, + "Ġplenty": 11510, + "ĠCross": 11511, + "ĉret": 11512, + "dro": 11513, + "ĠCast": 11514, + "167": 11515, + "=true": 11516, + "ĠChris": 11517, + "icio": 11518, + "ĠMike": 11519, + "Decimal": 11520, + "addComponent": 11521, + "Len": 11522, + "Ġcock": 11523, + "Ġ#{": 11524, + "URN": 11525, + "": 11657, + "Ġ*=": 11658, + "ĠPS": 11659, + "Ġdangerous": 11660, + "[p": 11661, + "OME": 11662, + "Other": 11663, + "ĠStringBuilder": 11664, + "Points": 11665, + "heading": 11666, + "Ġcurrency": 11667, + "Ġpercentage": 11668, + "_API": 11669, + "Ġclassic": 11670, + "thead": 11671, + "ĠMO": 11672, + "FE": 11673, + "Idx": 11674, + "await": 11675, + "Ġè": 11676, + "Ġaccident": 11677, + "Ġvariant": 11678, + "Ġmyst": 11679, + "ĠLand": 11680, + "ĠBre": 11681, + "Ġharm": 11682, + "ĠAcc": 11683, + "Ġcharged": 11684, + "iones": 11685, + "Visibility": 11686, + "arry": 11687, + "ĠLanguage": 11688, + "Ġwalking": 11689, + "\".ĊĊ": 11690, + "ifer": 11691, + "Ġleadership": 11692, + ".From": 11693, + "ynam": 11694, + "Ġtimestamp": 11695, + "ipt": 11696, + "ĠHas": 11697, + "REFER": 11698, + "ĠIts": 11699, + "Ġlistener": 11700, + "UTE": 11701, + "213": 11702, + "_description": 11703, + "Ġexperiences": 11704, + "Ġcreates": 11705, + "RS": 11706, + "cart": 11707, + "black": 11708, + "Ġchoices": 11709, + "war": 11710, + "750": 11711, + "Ġ'''": 11712, + "Ġordered": 11713, + "Ġevening": 11714, + "Ġpil": 11715, + "Ġtun": 11716, + "ĠBad": 11717, + "(app": 11718, + "random": 11719, + "Ġexplicit": 11720, + "Ġarrived": 11721, + "Ġfly": 11722, + "Ġeconom": 11723, + "-mail": 11724, + "Ġlists": 11725, + "Ġarchitect": 11726, + "234": 11727, + "ĠPay": 11728, + "Ġds": 11729, + "ĠSol": 11730, + "Ġvehicles": 11731, + "Hz": 11732, + "-com": 11733, + "Ġking": 11734, + "_equal": 11735, + "ĠHelp": 11736, + "Ġabuse": 11737, + "480": 11738, + "169": 11739, + "--;Ċ": 11740, + "Ġextr": 11741, + "Ġchemical": 11742, + "ä¿": 11743, + "Ġorient": 11744, + "Ġbreath": 11745, + "ĠSpace": 11746, + "(element": 11747, + "wait": 11748, + "DED": 11749, + "igma": 11750, + "Ġentr": 11751, + "Ġsob": 11752, + "-name": 11753, + "Ġaffected": 11754, + "ika": 11755, + "Ġcoal": 11756, + "_work": 11757, + "Ġhundreds": 11758, + "Ġpolitics": 11759, + "subject": 11760, + "Ġconsumer": 11761, + "ANGE": 11762, + "Ġrepeated": 11763, + "Send": 11764, + "Ġ#[": 11765, + "Ġprotocol": 11766, + "Ġleads": 11767, + "useum": 11768, + "Every": 11769, + "808": 11770, + "174": 11771, + "Import": 11772, + "(count": 11773, + "Ġchallenges": 11774, + "Ġnovel": 11775, + "Ġdepart": 11776, + "bits": 11777, + ".Current": 11778, + "Ġ`${": 11779, + "oting": 11780, + "(\\": 11781, + "Ġcreative": 11782, + "Ġbuff": 11783, + "Ġintroduced": 11784, + "usic": 11785, + "modules": 11786, + "Are": 11787, + "-doc": 11788, + "language": 11789, + "_cache": 11790, + "Ġtod": 11791, + "?>": 11792, + "omething": 11793, + "Ġhun": 11794, + "åº": 11795, + "aters": 11796, + "Intent": 11797, + "Ġimplemented": 11798, + "ĠCase": 11799, + "Children": 11800, + "Ġnotification": 11801, + "Renderer": 11802, + "Wrapper": 11803, + "Objects": 11804, + "tl": 11805, + ".Contains": 11806, + "Plugin": 11807, + ".row": 11808, + "Ġforg": 11809, + "Ġpermit": 11810, + "Ġtargets": 11811, + "ĠIF": 11812, + "Ġtip": 11813, + "sex": 11814, + "Ġsupports": 11815, + "Ġfold": 11816, + "photo": 11817, + "},čĊ": 11818, + "Ġgoogle": 11819, + "$('#": 11820, + "Ġsharing": 11821, + "Ġgoods": 11822, + "vs": 11823, + "ĠDan": 11824, + "Rate": 11825, + "ĠMartin": 11826, + "Ġmanner": 11827, + "lie": 11828, + ".The": 11829, + "Internal": 11830, + "ĠCONTR": 11831, + "Mock": 11832, + "RIGHT": 11833, + "Ġ'{": 11834, + "Ġcontrols": 11835, + "Mat": 11836, + "Ġmand": 11837, + "Ġextended": 11838, + "Ok": 11839, + "Ġembed": 11840, + "Ġplanet": 11841, + "ĠNon": 11842, + "-ch": 11843, + ")\",": 11844, + "epar": 11845, + "Ġbelieved": 11846, + "ĠEnvironment": 11847, + "ĠFriend": 11848, + "-res": 11849, + "Ġhandling": 11850, + "nic": 11851, + "-level": 11852, + "scri": 11853, + "Xml": 11854, + "BE": 11855, + "ungen": 11856, + "Ġalter": 11857, + "[idx": 11858, + "Pop": 11859, + "cam": 11860, + "Ġ(((": 11861, + "Ġshipping": 11862, + "Ġbattery": 11863, + "iddleware": 11864, + "MC": 11865, + "Ġimpl": 11866, + "otation": 11867, + "ĠLab": 11868, + "